X-Git-Url: http://git.onelab.eu/?a=blobdiff_plain;f=src%2Fplanetlab.c;h=b931e812d13ab2e66d1c08fb6a7aef61353e0821;hb=361e96e42610e4f7600ae1175617f110874f563e;hp=9300744a5be31fb2056ef7c45dbbcae72a506450;hpb=c4ab647140e6387139cb7fd54c43e96fc6981a5c;p=util-vserver-pl.git diff --git a/src/planetlab.c b/src/planetlab.c index 9300744..b931e81 100644 --- a/src/planetlab.c +++ b/src/planetlab.c @@ -44,15 +44,28 @@ POSSIBILITY OF SUCH DAMAGE. #include #include #include +#define _GNU_SOURCE +#include #include "vserver.h" #include "planetlab.h" +#ifndef VC_NXC_RAW_SOCKET +# define VC_NXC_RAW_SOCKET 0x00000200ull +#endif +#ifndef VC_NXC_RAW_SEND +# define VC_NXC_RAW_SEND 0x00000400ull +#endif +#ifndef VC_NXF_LBACK_ALLOW +# define VC_NXF_LBACK_ALLOW 0x00000400ull +#endif + static int -create_context(xid_t ctx, uint64_t bcaps) +create_context(xid_t ctx, uint64_t bcaps, uint32_t unshare_flags) { - struct vc_ctx_caps vc_caps; + struct vc_ctx_caps vc_caps; struct vc_net_flags vc_nf; + struct vc_net_caps vc_ncaps; /* Create network context */ if (vc_net_create(ctx) == VC_NOCTX) { @@ -62,22 +75,35 @@ create_context(xid_t ctx, uint64_t bcaps) } /* Make the network context persistent */ - vc_nf.mask = vc_nf.flagword = VC_NXF_PERSISTENT; + vc_nf.mask = vc_nf.flagword = VC_NXF_PERSISTENT | VC_NXF_LBACK_ALLOW; if (vc_set_nflags(ctx, &vc_nf)) return -1; + /* Give it raw sockets capabilities */ + vc_ncaps.ncaps = vc_ncaps.cmask = VC_NXC_RAW_ICMP | VC_NXC_RAW_SOCKET; + if (vc_set_ncaps(ctx, &vc_ncaps)) + return -1; + tag: /* Create tag context */ if (vc_tag_create(ctx) == VC_NOCTX) return -1; process: + /* * Create context info - this sets the STATE_SETUP and STATE_INIT flags. */ if (vc_ctx_create(ctx, 0) == VC_NOCTX) return -1; + if (unshare_flags != 0) { + unshare(unshare_flags); + unshare_flags |= vc_get_space_mask(); + //printf("vc_set_namespace(%d, %X)\n", ctx, unshare_flags); + //vc_set_namespace(ctx, unshare_flags); + } + /* Set capabilities - these don't take effect until SETUP flag is unset */ vc_caps.bcaps = bcaps; vc_caps.bmask = ~0ULL; /* currently unused */ @@ -113,12 +139,14 @@ pl_setup_done(xid_t ctx) #define RETRY_LIMIT 10 int -pl_chcontext(xid_t ctx, uint64_t bcaps, const struct sliver_resources *slr) +pl_chcontext(xid_t ctx, uint64_t bcaps, const struct sliver_resources *slr, + int unshare_netns) { int retry_count = 0; int net_migrated = 0; - - pl_set_ulimits(slr); + + if (pl_set_ulimits(slr) != 0) + return -1; for (;;) { @@ -126,11 +154,15 @@ pl_chcontext(xid_t ctx, uint64_t bcaps, const struct sliver_resources *slr) if (vc_get_cflags(ctx, &vc_flags)) { + uint32_t unshare_flags; if (errno != ESRCH) return -1; + /* Always unshare the net namespace for a new context */ + unshare_flags = CLONE_NEWNET; + /* context doesn't exist - create it */ - if (create_context(ctx, bcaps)) + if (create_context(ctx, bcaps, unshare_flags)) { if (errno == EEXIST) /* another process beat us in a race */ @@ -162,6 +194,17 @@ pl_chcontext(xid_t ctx, uint64_t bcaps, const struct sliver_resources *slr) migrate: if (net_migrated || !vc_net_migrate(ctx)) { + uint32_t unshare_flags; + + /* Unshare the net namespace if requested in the slice config */ + unshare_flags = unshare_netns ? CLONE_NEWNET : 0; + + if (unshare_flags != 0) { + unshare_flags |=vc_get_space_mask(); + //printf("vc_enter_namespace(%d, %X)\n", ctx, unshare_flags); + //vc_enter_namespace(ctx, unshare_flags); + } + if (!vc_tag_migrate(ctx) && !vc_ctx_migrate(ctx, 0)) break; /* done */ net_migrated = 1; @@ -215,9 +258,18 @@ pl_setsched(xid_t ctx, uint32_t cpu_min, uint32_t cpu_share) return 0; } +enum { + TYPE_LONG = 1, + TYPE_PERS = 2, +}; + struct pl_resources { char *name; - unsigned long long *limit; + unsigned type; + union { + unsigned long long *limit; + unsigned long int *personality; + }; }; #define WHITESPACE(buffer,index,len) \ @@ -225,6 +277,7 @@ struct pl_resources { if (index < len) index++; else goto out; #define VSERVERCONF "/etc/vservers/" + void pl_get_limits(const char *context, struct sliver_resources *slr) { @@ -234,23 +287,25 @@ pl_get_limits(const char *context, struct sliver_resources *slr) char *conf = (char *)malloc(len + strlen("rlimits/openfd.hard")); struct pl_resources *r; struct pl_resources sliver_list[] = { - {"sched/fill-rate2", &slr->vs_cpu}, + {"sched/fill-rate2", TYPE_LONG, &slr->vs_cpu}, - {"rlimits/nproc.hard", &slr->vs_nproc.hard}, - {"rlimits/nproc.soft", &slr->vs_nproc.soft}, - {"rlimits/nproc.min", &slr->vs_nproc.min}, + {"rlimits/nproc.hard", TYPE_LONG, &slr->vs_nproc.hard}, + {"rlimits/nproc.soft", TYPE_LONG, &slr->vs_nproc.soft}, + {"rlimits/nproc.min", TYPE_LONG, &slr->vs_nproc.min}, - {"rlimits/rss.hard", &slr->vs_rss.hard}, - {"rlimits/rss.soft", &slr->vs_rss.soft}, - {"rlimits/rss.min", &slr->vs_rss.min}, + {"rlimits/rss.hard", TYPE_LONG, &slr->vs_rss.hard}, + {"rlimits/rss.soft", TYPE_LONG, &slr->vs_rss.soft}, + {"rlimits/rss.min", TYPE_LONG, &slr->vs_rss.min}, - {"rlimits/as.hard", &slr->vs_as.hard}, - {"rlimits/as.soft", &slr->vs_as.soft}, - {"rlimits/as.min", &slr->vs_as.min}, + {"rlimits/as.hard", TYPE_LONG, &slr->vs_as.hard}, + {"rlimits/as.soft", TYPE_LONG, &slr->vs_as.soft}, + {"rlimits/as.min", TYPE_LONG, &slr->vs_as.min}, - {"rlimits/openfd.hard", &slr->vs_openfd.hard}, - {"rlimits/openfd.soft", &slr->vs_openfd.soft}, - {"rlimits/openfd.min", &slr->vs_openfd.min}, + {"rlimits/openfd.hard", TYPE_LONG, &slr->vs_openfd.hard}, + {"rlimits/openfd.soft", TYPE_LONG, &slr->vs_openfd.soft}, + {"rlimits/openfd.min", TYPE_LONG, &slr->vs_openfd.min}, + + {"personality", TYPE_PERS, &slr->personality}, {0,0} }; @@ -273,6 +328,8 @@ pl_get_limits(const char *context, struct sliver_resources *slr) slr->vs_openfd.soft = VC_LIM_KEEP; slr->vs_openfd.min = VC_LIM_KEEP; + slr->personality = 0; + cwd = open(".", O_RDONLY); if (cwd == -1) { perror("cannot get a handle on ."); @@ -289,8 +346,24 @@ pl_get_limits(const char *context, struct sliver_resources *slr) fb = fopen(r->name, "r"); if (fb == NULL) continue; - if (fgets(buf, sizeof(buf), fb) != NULL && isdigit(*buf)) - *r->limit = atoi(buf); + if (fgets(buf, sizeof(buf), fb) != NULL) { + len=strlen(buf); + /* remove trailing newline */ + if (buf[len-1] == '\n') { + buf[len-1]='\0'; + len --; + } + if ( (r->type == TYPE_LONG) && isdigit(*buf)) { + *r->limit = atoi(buf); + } else if ( (r->type == TYPE_PERS) && isalpha(*buf)) { + unsigned long int res; + res = vc_str2personalitytype(buf,len); + if (res != VC_BAD_PERSONALITY) { + *r->personality = res; + } + } + } + fclose(fb); } @@ -333,7 +406,7 @@ adjust_lim(const struct vc_rlimit *vcr, struct rlimit *lim) if (vcr->hard < vcr->min) break; case 0: - lim->rlim_cur = vcr->hard; + lim->rlim_max = vcr->hard; adjusted = 1; } } @@ -349,14 +422,26 @@ set_one_ulimit(int resource, const struct vc_rlimit *limit) setrlimit(resource, &lim); } -void +static inline int +set_personality(unsigned long int personality_arg) +{ + if (personality_arg == 0) + return 0; + if (personality(personality_arg) < 0) { + return -1; + } + return 0; +} + +int pl_set_ulimits(const struct sliver_resources *slr) { if (!slr) - return; + return 0; set_one_ulimit(RLIMIT_RSS, &slr->vs_rss); set_one_ulimit(RLIMIT_AS, &slr->vs_as); set_one_ulimit(RLIMIT_NPROC, &slr->vs_nproc); set_one_ulimit(RLIMIT_NOFILE, &slr->vs_openfd); + return set_personality(slr->personality); }