package Sys::Linux::Namespace;
# ABSTRACT: Sets up linux kernel namespaces

use strict;
use warnings;

use Sys::Linux::Mount qw/:all/;
use Sys::Linux::Unshare qw/:all/;
use POSIX qw/_exit/;

use Moo;
use Carp qw/carp/;

# Declare one read/write attribute per namespace option:
# private_tmp, private_mount, private_pid, private_net, private_ipc,
# private_user, private_uts and private_sysvsem.
for my $p (qw/tmp mount pid net ipc user uts sysvsem/) {
  my $pp = "private_$p";
  has $pp => (is => 'rw');
}

has code => (is => 'rw'); # code to run in the namespace

# Build the flag bitmask handed to unshare() from the private_* attributes.
# A private /tmp implies a private mount namespace, so either attribute
# turns on CLONE_NEWNS.  Returns 0 when no attribute is set.
sub _uflags {
  my $self = shift;
  my $uflags = 0;

  $uflags |= CLONE_NEWNS   if ($self->private_tmp || $self->private_mount);
  $uflags |= CLONE_NEWPID  if ($self->private_pid);
  $uflags |= CLONE_NEWNET  if ($self->private_net);
  $uflags |= CLONE_NEWIPC  if ($self->private_ipc);
  $uflags |= CLONE_NEWUSER if ($self->private_user);
  $uflags |= CLONE_NEWUTS  if ($self->private_uts);
  $uflags |= CLONE_SYSVSEM if ($self->private_sysvsem);

  return $uflags;
}

# Run $code->(%args) in a forked child and wait for it to finish.
#
# Parameters:
#   $code - CODE ref to run in the child (dies if it is not a CODE ref)
#   %args - passed through to $code unchanged
#
# Returns the child's wait status ($?) in the parent.  The child never
# returns: it leaves via _exit() with 0 on success or 255 if $code died.
# Dies in the parent if fork() fails.
sub _subprocess {
  my ($self, $code, %args) = @_;
  die "_subprocess requires a CODE ref" unless ref $code eq 'CODE';

  my $pid = fork();

  # fork() signals failure with undef, not a negative number.  Without this
  # check a failed fork would send the *parent* down the child branch, where
  # it would run $code and then _exit().
  die "Failed to fork: $!" unless defined $pid;

  if ($pid) {
    waitpid($pid, 0); # block and wait on child
    return $?;
  }

  # Child.  Trap exceptions so a die inside $code cannot unwind back into the
  # caller's code (e.g. an eval around setup()) and leave two processes
  # running the parent's program.
  my $ok = eval { $code->(%args); 1 };
  unless ($ok) {
    warn $@;
    _exit(255);
  }

  _exit(0);
}

# Validate the configuration before any namespace is touched.
# Dies if private_net is requested (not implemented), or if private_pid is
# requested and no coderef is available to run in the new PID namespace.
sub pre_setup {
  my ($self, %args) = @_;

  die "Private net is not yet supported" if $self->private_net;

  # Check the same coderef setup() will run: the one passed to setup() wins
  # over the one given at construction.  Only one of the two is required.
  my $code = $args{code} // $self->code;
  if ($self->private_pid && ref($code) ne 'CODE') {
    die "Private PID space requires a coderef to become the new PID 1";
  }

  return;
}

# Adjust mounts once unshare() has been called.
# Dies if private_tmp holds a reference that is not a HASH ref.
sub post_setup {
  my ($self, %args) = @_;

  # If we want a private /tmp, or private mount we need to recursively make
  # every mount private.  It CAN be done without that but this is more reliable.
  if ($self->private_mount || $self->private_tmp) {
    mount("/", "/", undef, MS_REC|MS_PRIVATE, undef);
  }

  my $tmp = $self->private_tmp;
  return unless $tmp;

  # TODO do this with a constraint?
  my $type = ref $tmp;
  die "Bad ref type passed as private_tmp" if $type && $type ne 'HASH';

  # A hashref is handed to the second mount() call as its options; a plain
  # true value means no options.
  my $options = $type eq 'HASH' ? $tmp : undef;

  mount("/tmp", "/tmp", "tmpfs", 0, undef);
  mount("/tmp", "/tmp", "tmpfs", MS_PRIVATE, $options);

  return;
}

# Engage the configured namespaces.
#
# Parameters (named):
#   code - optional coderef; overrides the one given at construction.
#   Every argument, including code, is passed through to the coderef.
#
# With a coderef the work happens in a forked child (and a further forked
# grandchild when private_pid is set) and this process is left untouched.
# Without one, the namespaces are applied to the current process.
# Always returns 1; the child's exit status is not reported.
sub setup {
  my ($self, %args) = @_;

  my $uflags = $self->_uflags;
  $self->pre_setup(%args);

  my $code = $args{code} // $self->code();

  if ($code) {
    $self->_subprocess(sub {
      unshare($uflags);

      # We've just unshared, if we wanted a private pid space we MUST fork again.
      if ($self->private_pid) {
        $self->_subprocess(sub {
          $self->post_setup(%args);
          $code->(%args);
        }, %args);
      } else {
        $self->post_setup(%args);
        $code->(%args);
      }
    }, %args);
  } else {
    unshare($uflags);
    $self->post_setup(%args);
  }

  return 1;
}

1;

__END__

=head1 NAME

Sys::Linux::Namespace - A Module for setting up linux namespaces

=head1 SYNOPSIS

    use Sys::Linux::Namespace;

    # Create a namespace with a private /tmp
    my $ns1 = Sys::Linux::Namespace->new(private_tmp => 1);

    $ns1->setup(code => sub {
        # This code has its own completely private /tmp filesystem
        open(my $fh, ">", "/tmp/private") or die "Can't write /tmp/private: $!";
        print $fh "Hello Void\n";
        close($fh);
    });

    # Create a second namespace, this time with a private PID space too
    my $ns2 = Sys::Linux::Namespace->new(private_tmp => 1, private_pid => 1);
    $ns2->setup(code => sub {
        # I will only see PID 1. I can fork anything I want and they will only see me
        # if I die they die too.
        use Data::Dumper;
        print Dumper([glob "/proc/*"]);
    });

    # We're back to our previous global /tmp and PID namespace
    # all processes and private filesystems have been removed

    # Now let's set up a private /tmp
    $ns1->setup();

    # We're now permanently (for this process) using a private /tmp.

=head1 REQUIREMENTS

This module requires your script to have CAP_SYS_ADMIN, usually by running as C<root>. Without that it will fail to setup the namespaces and cause your program to exit.

=head1 METHODS

=head2 C<new>

Construct a new Sys::Linux::Namespace object. This collects all the options you want to enable, but does not engage them.

All arguments are passed in like a hash.

=over 1

=item code

A coderef to run when setting up the namespaces. This gets run in a child process that's isolated from the parent.
If you don't pass one in during construction or to C<setup> then the namespace changes will happen to the current process.

=item private_mount

Set up a private mount namespace. This makes every currently mounted filesystem private to our process, which means we can unmount and mount new filesystems without other processes seeing the mounts.

=item private_tmp

Sets up the private mount namespace as above, but also automatically sets up /tmp to be a clean private tmpfs mount. Takes either a true value, or a hashref with options to pass to the mount syscall. See C<mount(8)> for a list of possible options.

=item private_pid

Create a private PID namespace. This requires a C<code> parameter either to C<new> or to C<setup>.

=item private_net

TODO This is not yet implemented. Once done however, it will allow a child process to execute with a private network preventing communication. Will require a C<code> parameter to C<new> or C<setup>.

=item private_ipc

Create a private IPC namespace.

=item private_user

Create a new user namespace. See C<user_namespaces(7)> for more information.

=item private_uts

Create a new UTS namespace. This will let you safely change the hostname of the system without affecting anyone else.

=item private_sysvsem

Create a new System V Semaphore namespace. This will let you create new semaphores without anyone else touching them.

=back

=head2 C<setup>

Engage the namespaces with all the configured options. All arguments are passed by name like a hash.

You may pass in a C<code> parameter to run in a child process; this overrides one provided during construction. Any other parameters are passed through to your coderef if present.

=head1 AUTHOR

Ryan Voots L<simcop@cpan.org|mailto:SIMCOP@cpan.org>

=cut