aboutsummaryrefslogtreecommitdiff
path: root/gnu/bootloader.scm
diff options
context:
space:
mode:
author: John Soo <jsoo1@asu.edu>, 2020-01-15 09:34:03 -0800
committer: Efraim Flashner <efraim@flashner.co.il>, 2020-01-21 16:23:48 +0200
commit: 04020a73b3dea169f806d4f0d04cd2505d50efa1 (patch)
tree: f6c98fbe39d8b4b719d9078ef4fb658093fadfd2 /gnu/bootloader.scm
parent: b2f948be9f815582a49bd80a9594a881d7d1a56e (diff)
download: guix-04020a73b3dea169f806d4f0d04cd2505d50efa1.tar.gz
guix-04020a73b3dea169f806d4f0d04cd2505d50efa1.zip
gnu: Add rust-handlebars-2.0.
* gnu/packages/crates-io.scm (rust-handlebars-2.0): New variable. Signed-off-by: Efraim Flashner <efraim@flashner.co.il>
Diffstat (limited to 'gnu/bootloader.scm')
0 files changed, 0 insertions, 0 deletions
ot; (logior MS_NOEXEC MS_NOSUID MS_NODEV))) ;; A sysfs mount requires the user to have the CAP_SYS_ADMIN capability in ;; the current network namespace. (when mount-/sys? (mount* "none" (scope "/sys") "sysfs" (logior MS_NOEXEC MS_NOSUID MS_NODEV MS_RDONLY))) (mount* "none" (scope "/dev") "tmpfs" (logior MS_NOEXEC MS_STRICTATIME) "mode=755") ;; Create essential device nodes via bind-mounting them from the ;; host, because a process within a user namespace cannot create ;; device nodes. (for-each (lambda (device) (when (file-exists? device) ;; Create the mount point file. (touch (scope device)) (bind-mount device (scope device)))) '("/dev/null" "/dev/zero" "/dev/full" "/dev/random" "/dev/urandom" "/dev/tty" "/dev/fuse")) ;; Mount a new devpts instance on /dev/pts. (when (file-exists? "/dev/ptmx") (mount* "none" (scope "/dev/pts") "devpts" 0 "newinstance,mode=0620") (symlink "/dev/pts/ptmx" (scope "/dev/ptmx"))) ;; Setup the container's /dev/console by bind mounting the pseudo-terminal ;; associated with standard input when there is one. (let* ((in (current-input-port)) (tty (catch 'system-error (lambda () ;; This call throws if IN does not correspond to a tty. ;; This is more reliable than 'isatty?'. (ttyname in)) (const #f))) (console (scope "/dev/console"))) (when tty (touch console) (chmod console #o600) (bind-mount tty console))) ;; Setup standard input/output/error. (symlink "/proc/self/fd" (scope "/dev/fd")) (symlink "/proc/self/fd/0" (scope "/dev/stdin")) (symlink "/proc/self/fd/1" (scope "/dev/stdout")) (symlink "/proc/self/fd/2" (scope "/dev/stderr")) ;; Mount user-specified file systems. (for-each (lambda (file-system) (mount-file-system file-system #:root root)) mounts) ;; Jail the process inside the container's root file system. 
(let ((put-old (string-append root "/real-root"))) (mkdir put-old) (pivot-root root put-old) (chdir "/") (umount "real-root" MNT_DETACH) (rmdir "real-root") (chmod "/" #o755)))

(define* (initialize-user-namespace pid host-uids
                                    #:key (guest-uid 0) (guest-gid 0))
  "Configure the user namespace for PID.  HOST-UIDS specifies the number of
host user identifiers to map into the user namespace.  GUEST-UID and GUEST-GID
specify the first UID (respectively GID) that host UIDs (respectively GIDs)
map to in the namespace."
  (define proc-dir
    (string-append "/proc/" (number->string pid)))

  ;; Return the name of FILE (which starts with a slash) under /proc/PID.
  (define (scope file)
    (string-append proc-dir file))

  (let ((uid (getuid))
        (gid (getgid)))

    ;; Only root can write to the gid map without first disabling the
    ;; setgroups syscall.
    (unless (and (zero? uid) (zero? gid))
      (call-with-output-file (scope "/setgroups")
        (lambda (port)
          (display "deny" port))))

    ;; Map HOST-UIDS identifiers, starting at the UID/GID of the user that
    ;; created the container, to identifiers starting at GUEST-UID/GUEST-GID
    ;; within the container (by default 0, i.e., the root user).
    (call-with-output-file (scope "/uid_map")
      (lambda (port)
        (format port "~d ~d ~d" guest-uid uid host-uids)))
    (call-with-output-file (scope "/gid_map")
      (lambda (port)
        (format port "~d ~d ~d" guest-gid gid host-uids)))))

(define (namespaces->bit-mask namespaces)
  "Return the number suitable for the 'flags' argument of 'clone' that
corresponds to the symbols in NAMESPACES.  Recognized symbols are: cgroup,
mnt, uts, ipc, user, pid, and net; any other element makes the match fail."
  ;; Use the same flags as fork(3) in addition to the namespace flags.
  (apply logior SIGCHLD
         (map (match-lambda
                ('cgroup CLONE_NEWCGROUP)
                ('mnt    CLONE_NEWNS)
                ('uts    CLONE_NEWUTS)
                ('ipc    CLONE_NEWIPC)
                ('user   CLONE_NEWUSER)
                ('pid    CLONE_NEWPID)
                ('net    CLONE_NEWNET))
              namespaces)))

(define* (run-container root mounts namespaces host-uids thunk
                        #:key (guest-uid 0) (guest-gid 0))
  "Run THUNK in a new container process and return its PID.  ROOT specifies
the root directory for the container.  MOUNTS is a list of <file-system>
objects that specify file systems to mount inside the container.  NAMESPACES
is a list of symbols that correspond to the possible Linux namespaces: mnt,
ipc, uts, pid, user, net, and cgroup.

HOST-UIDS specifies the number of host user identifiers to map into the user
namespace.  GUEST-UID and GUEST-GID specify the first UID (respectively GID)
that host UIDs (respectively GIDs) map to in the namespace.

If setting up the file systems in the child throws, the exception is
forwarded and re-thrown in the calling process.  Return #f if the child
terminates without reporting either success or an exception."
  ;; The parent process must initialize the user namespace for the child
  ;; before it can boot.  To negotiate this, a socket pair is used such that
  ;; the child process blocks until the parent writes to it.
  (match (socketpair PF_UNIX (logior SOCK_CLOEXEC SOCK_STREAM) 0)
    ((child . parent)
     (let ((flags (namespaces->bit-mask namespaces)))
       (match (clone flags)
         (0
          (call-with-clean-exit
           (lambda ()
             (close-port parent)
             ;; Wait for parent to set things up.
             (match (read child)
               ('ready
                (purify-environment)
                (when (and (memq 'mnt namespaces)
                           (not (string=? root "/")))
                  (catch #t
                    (lambda ()
                      (mount-file-systems root mounts
                                          #:mount-/proc? (memq 'pid namespaces)
                                          #:mount-/sys? (memq 'net namespaces)))
                    (lambda args
                      ;; Forward the exception to the parent process.
                      ;; FIXME: SRFI-35 conditions and non-trivial objects
                      ;; cannot be 'read' so they shouldn't be written as is.
                      (write args child)
                      (primitive-exit 3))))
                ;; TODO: Manage capabilities.
                (write 'ready child)
                (close-port child)
                (thunk))
               (_                                 ;parent died or something
                (primitive-exit 2))))))
         (pid
          (close-port child)
          (when (memq 'user namespaces)
            (initialize-user-namespace pid host-uids
                                       #:guest-uid guest-uid
                                       #:guest-gid guest-gid))
          ;; TODO: Initialize cgroups.
          ;; The trailing newline delimits the symbol for the child's 'read'.
          (write 'ready parent)
          (newline parent)

          ;; Check whether the child process' setup phase succeeded.
          (let ((message (read parent)))
            (close-port parent)
            (match message
              ('ready                             ;success
               pid)
              (((? symbol? key) args ...)         ;exception
               (apply throw key args))
              (_                                  ;unexpected termination
               #f)))))))))

;; FIXME: This is copied from (guix utils), which we cannot use because it
;; would pull (guix config) and all.
(define (call-with-temporary-directory proc)
  "Call PROC with a name of a temporary directory; close the directory and
delete it when leaving the dynamic extent of this call.  The directory is
created under $TMPDIR, or under /tmp when TMPDIR is unset."
  (let* ((directory (or (getenv "TMPDIR") "/tmp"))
         (template  (string-append directory "/guix-directory.XXXXXX"))
         (tmp-dir   (mkdtemp! template)))
    (dynamic-wind
      (const #t)
      (lambda ()
        (proc tmp-dir))
      (lambda ()
        ;; Deletion is best-effort: errors while cleaning up are ignored.
        (false-if-exception (delete-file-recursively tmp-dir))))))

(define (wait-child-process)
  "Wait for one child process and return a pair, like 'waitpid', or return #f
if there are no child processes left."
  (catch 'system-error
    (lambda ()
      (waitpid WAIT_ANY))
    (lambda args
      ;; ECHILD means there is nothing left to wait for; anything else is a
      ;; genuine error and is re-thrown.
      (if (= ECHILD (system-error-errno args))
          #f
          (apply throw args)))))

(define (status->exit-status status)
  "Reify STATUS as an exit status: the exit value when there is one, otherwise
128 plus the number of the signal that terminated or stopped the process."
  (or (status:exit-val status)
      ;; See <http://www.tldp.org/LDP/abs/html/exitcodes.html#EXITCODESREF>.
      (+ 128 (or (status:term-sig status)
                 (status:stop-sig status)))))

(define* (call-with-container mounts thunk #:key (namespaces %namespaces)
                              (host-uids 1) (guest-uid 0) (guest-gid 0)
                              (relayed-signals (list SIGINT SIGTERM))
                              (child-is-pid1? #t)
                              (process-spawned-hook (const #t)))
  "Run THUNK in a new container process and return its status, an integer as
returned by 'waitpid'; call PROCESS-SPAWNED-HOOK with the PID of the new
process that has been spawned.  MOUNTS is a list of <file-system> objects that
specify file systems to mount inside the container.  NAMESPACES is a list of
symbols corresponding to the identifiers for Linux namespaces: mnt, ipc, uts,
pid, user, and net.  By default, all namespaces are used.  HOST-UIDS is the
number of host user identifiers to map into the container's user namespace, if
there is one.  By default, only a single uid/gid, that of the current user, is
mapped into the container.  The host user that creates the container is the
root user (uid/gid 0) within the container.  Only root can map more than a
single uid/gid.

GUEST-UID and GUEST-GID specify the first UID (respectively GID) that host
UIDs (respectively GIDs) map to in the namespace.

RELAYED-SIGNALS is the list of signals that are \"relayed\" to the container
process when caught by its parent.

When CHILD-IS-PID1? is true, and if NAMESPACES contains 'pid', then the child
process runs directly as PID 1.  As such, it is responsible for (1) installing
signal handlers and (2) reaping terminated processes by calling 'waitpid'.
When CHILD-IS-PID1? is false, a new intermediate process is created instead
that takes this responsibility.

Note that if THUNK needs to load any additional Guile modules, the relevant
module files must be present in one of the mappings in MOUNTS and the Guile
load path must be adjusted as needed."
  (define thunk*
    (if (and (memq 'pid namespaces)
             (not child-is-pid1?))
        (lambda ()
          ;; Behave like an init process: create a sub-process that calls
          ;; THUNK, and wait for child processes.  Furthermore, forward
          ;; RELAYED-SIGNALS to the child process.
          (match (primitive-fork)
            (0
             (call-with-clean-exit thunk))
            (pid
             (install-signal-handlers pid)
             (let loop ()
               (match (wait-child-process)
                 ((child . status)
                  ;; Exit with THUNK's status once it terminates; keep
                  ;; reaping any other child in the meantime.
                  (if (= child pid)
                      (primitive-exit
                       (status->exit-status status))
                      (loop)))
                 (#f
                  (primitive-exit 128)))))))      ;cannot happen
        thunk))

  (define (periodically-schedule-asyncs)
    ;; XXX: In Guile there's a time window where a signal-handling async could
    ;; be queued without being processed by the time we enter a blocking
    ;; syscall like waitpid(2) (info "(guile) Signals").  This terrible hack
    ;; ensures pending asyncs get a chance to run periodically.
    (sigaction SIGALRM (lambda _ (alarm 1)))
    (alarm 1))

  (define (install-signal-handlers pid)
    ;; Install handlers that forward signals to PID.
    (define (relay-signal signal)
      (false-if-exception (kill pid signal)))

    (periodically-schedule-asyncs)
    (for-each (lambda (signal)
                (sigaction signal relay-signal))
              relayed-signals))

  (call-with-temporary-directory
   (lambda (root)
     (let ((pid (run-container root mounts namespaces host-uids thunk*
                               #:guest-uid guest-uid
                               #:guest-gid guest-gid)))
       (install-signal-handlers pid)
       (process-spawned-hook pid)
       (match (waitpid pid)
         ((_ . status) status))))))

(define (container-excursion pid thunk)
  "Run THUNK as a child process within the namespaces of process PID and
return the exit status, an integer as returned by 'waitpid'."
  (define (namespace-file pid namespace)
    (string-append "/proc/" (number->string pid) "/ns/" namespace))

  (match (primitive-fork)
    (0
     (call-with-clean-exit
      (lambda ()
        (for-each (lambda (ns)
                    (let ((source (namespace-file (getpid) ns))
                          (target (namespace-file pid ns)))
                      ;; Joining the namespace that the process already
                      ;; belongs to would throw an error so avoid that.
                      ;; XXX: This /proc interface leads to TOCTTOU.
                      (unless (string=? (readlink source) (readlink target))
                        ;; Only the target namespace file needs to be open:
                        ;; 'setns' takes its file descriptor.
                        (call-with-input-file target
                          (lambda (new-ns-port)
                            (setns (fileno new-ns-port) 0))))))
                  ;; It's important that the user namespace is joined first,
                  ;; so that the user will have the privileges to join the
                  ;; other namespaces.  Furthermore, it's important that the
                  ;; mount namespace is joined last, otherwise the /proc mount
                  ;; point would no longer be accessible.
                  '("user" "ipc" "uts" "net" "pid" "mnt"))
        (purify-environment)
        (chdir "/")

        ;; Per setns(2), changing the PID namespace only applies to child
        ;; processes, not to the process itself.  Thus fork so that THUNK runs
        ;; in the right PID namespace, which also gives it access to /proc.
        (match (primitive-fork)
          (0
           (call-with-clean-exit thunk))
          (pid
           ;; Propagate THUNK's exit value, or 127 if it did not exit
           ;; normally.
           (primitive-exit
            (match (waitpid pid)
              ((_ . status)
               (or (status:exit-val status) 127)))))))))
    (pid
     (match (waitpid pid)
       ((_ . status)
        status)))))

(define (container-excursion* pid thunk)
  "Like 'container-excursion', but return the return value of THUNK.  The
value is transferred with 'write' and 'read', so it must have a readable
external representation.  Return #f when the excursion's status is non-zero."
  (match (pipe)
    ((in . out)
     ;; Make sure IN and OUT are not inherited if THUNK forks + execs.
     (fcntl in F_SETFD FD_CLOEXEC)
     (fcntl out F_SETFD FD_CLOEXEC)

     (match (container-excursion pid
              (lambda ()
                (close-port in)
                (write (thunk) out)
                (close-port out)))
       (0
        (close-port out)
        (let ((result (read in)))
          (close-port in)
          result))
       (_                                         ;maybe PID died already
        (close-port out)
        (close-port in)
        #f)))))