#include <ctype.h>
#include <sys/resource.h>
#include <fcntl.h>
+#define _GNU_SOURCE /* NOTE(review): feature-test macros only take effect when defined before the first system header; this follows <ctype.h>, <sys/resource.h> and <fcntl.h> - consider moving it to the top of the file or passing -D_GNU_SOURCE */
+#include <sched.h> /* presumably for unshare() and CLONE_NEWNET used below - confirm */
#include "vserver.h"
#include "planetlab.h"
+#ifndef VC_NXC_RAW_SOCKET
+# define VC_NXC_RAW_SOCKET 0x00000200ull
+#endif
+#ifndef VC_NXC_RAW_SEND
+# define VC_NXC_RAW_SEND 0x00000400ull
+#endif
+#ifndef VC_NXF_LBACK_ALLOW
+# define VC_NXF_LBACK_ALLOW 0x00000400ull
+#endif
+
static int
-create_context(xid_t ctx, uint64_t bcaps)
+create_context(xid_t ctx, uint64_t bcaps, uint32_t unshare_flags)
{
- struct vc_ctx_caps vc_caps;
+ struct vc_ctx_caps vc_caps;
struct vc_net_flags vc_nf;
+ struct vc_net_caps vc_ncaps;
/* Create network context */
if (vc_net_create(ctx) == VC_NOCTX) {
}
/* Make the network context persistent */
- vc_nf.mask = vc_nf.flagword = VC_NXF_PERSISTENT;
+ vc_nf.mask = vc_nf.flagword = VC_NXF_PERSISTENT | VC_NXF_LBACK_ALLOW;
if (vc_set_nflags(ctx, &vc_nf))
return -1;
+ /* Give it raw sockets capabilities */
+ vc_ncaps.ncaps = vc_ncaps.cmask = VC_NXC_RAW_ICMP | VC_NXC_RAW_SOCKET;
+ if (vc_set_ncaps(ctx, &vc_ncaps))
+ return -1;
+
tag:
/* Create tag context */
if (vc_tag_create(ctx) == VC_NOCTX)
return -1;
process:
+
/*
* Create context info - this sets the STATE_SETUP and STATE_INIT flags.
*/
if (vc_ctx_create(ctx, 0) == VC_NOCTX)
return -1;
+ if (unshare_flags != 0) {
+ unshare(unshare_flags);
+ unshare_flags |= vc_get_space_mask();
+ //printf("vc_set_namespace(%d, %X)\n", ctx, unshare_flags);
+ //vc_set_namespace(ctx, unshare_flags);
+ }
+
/* Set capabilities - these don't take effect until SETUP flag is unset */
vc_caps.bcaps = bcaps;
vc_caps.bmask = ~0ULL; /* currently unused */
#define RETRY_LIMIT 10
int
-pl_chcontext(xid_t ctx, uint64_t bcaps, const struct sliver_resources *slr)
+pl_chcontext(xid_t ctx, uint64_t bcaps, const struct sliver_resources *slr,
+ int unshare_netns)
{
int retry_count = 0;
int net_migrated = 0;
-
- pl_set_ulimits(slr);
+
+ if (pl_set_ulimits(slr) != 0)
+ return -1;
for (;;)
{
if (vc_get_cflags(ctx, &vc_flags))
{
+ uint32_t unshare_flags;
if (errno != ESRCH)
return -1;
+ /* Always unshare the net namespace for a new context */
+ unshare_flags = CLONE_NEWNET;
+
/* context doesn't exist - create it */
- if (create_context(ctx, bcaps))
+ if (create_context(ctx, bcaps, unshare_flags))
{
if (errno == EEXIST)
/* another process beat us in a race */
migrate:
if (net_migrated || !vc_net_migrate(ctx))
{
+ uint32_t unshare_flags;
+
+ /* Unshare the net namespace if requested in the slice config */
+ unshare_flags = unshare_netns ? CLONE_NEWNET : 0;
+
+ if (unshare_flags != 0) {
+ unshare_flags |=vc_get_space_mask();
+ //printf("vc_enter_namespace(%d, %X)\n", ctx, unshare_flags);
+ //vc_enter_namespace(ctx, unshare_flags);
+ }
+
if (!vc_tag_migrate(ctx) && !vc_ctx_migrate(ctx, 0))
break; /* done */
net_migrated = 1;
return 0;
}
+enum { /* values for pl_resources.type; selects which union member an entry uses */
+ TYPE_LONG = 1, /* entry is parsed as a number and stored through ->limit */
+ TYPE_PERS = 2, /* entry is parsed as a personality name and stored through ->personality */
+};
+
struct pl_resources {
char *name;
- unsigned long long *limit;
+ unsigned type; /* TYPE_LONG or TYPE_PERS; tells the reader which union member below is valid */
+ union { /* destination for the parsed value; exactly one member is meaningful per entry */
+ unsigned long long *limit; /* written when type == TYPE_LONG */
+ unsigned long int *personality; /* written when type == TYPE_PERS; NOTE(review): positional initializers set the first union member (limit), so TYPE_PERS table entries rely on the two pointer members sharing storage - confirm this is intended */
+ };
};
#define WHITESPACE(buffer,index,len) \
if (index < len) index++; else goto out;
#define VSERVERCONF "/etc/vservers/"
+
void
pl_get_limits(const char *context, struct sliver_resources *slr)
{
char *conf = (char *)malloc(len + strlen("rlimits/openfd.hard"));
struct pl_resources *r;
struct pl_resources sliver_list[] = {
- {"sched/fill-rate2", &slr->vs_cpu},
+ {"sched/fill-rate2", TYPE_LONG, &slr->vs_cpu},
- {"rlimits/nproc.hard", &slr->vs_nproc.hard},
- {"rlimits/nproc.soft", &slr->vs_nproc.soft},
- {"rlimits/nproc.min", &slr->vs_nproc.min},
+ {"rlimits/nproc.hard", TYPE_LONG, &slr->vs_nproc.hard},
+ {"rlimits/nproc.soft", TYPE_LONG, &slr->vs_nproc.soft},
+ {"rlimits/nproc.min", TYPE_LONG, &slr->vs_nproc.min},
- {"rlimits/rss.hard", &slr->vs_rss.hard},
- {"rlimits/rss.soft", &slr->vs_rss.soft},
- {"rlimits/rss.min", &slr->vs_rss.min},
+ {"rlimits/rss.hard", TYPE_LONG, &slr->vs_rss.hard},
+ {"rlimits/rss.soft", TYPE_LONG, &slr->vs_rss.soft},
+ {"rlimits/rss.min", TYPE_LONG, &slr->vs_rss.min},
- {"rlimits/as.hard", &slr->vs_as.hard},
- {"rlimits/as.soft", &slr->vs_as.soft},
- {"rlimits/as.min", &slr->vs_as.min},
+ {"rlimits/as.hard", TYPE_LONG, &slr->vs_as.hard},
+ {"rlimits/as.soft", TYPE_LONG, &slr->vs_as.soft},
+ {"rlimits/as.min", TYPE_LONG, &slr->vs_as.min},
- {"rlimits/openfd.hard", &slr->vs_openfd.hard},
- {"rlimits/openfd.soft", &slr->vs_openfd.soft},
- {"rlimits/openfd.min", &slr->vs_openfd.min},
+ {"rlimits/openfd.hard", TYPE_LONG, &slr->vs_openfd.hard},
+ {"rlimits/openfd.soft", TYPE_LONG, &slr->vs_openfd.soft},
+ {"rlimits/openfd.min", TYPE_LONG, &slr->vs_openfd.min},
+
+ {"personality", TYPE_PERS, &slr->personality},
{0,0}
};
slr->vs_openfd.soft = VC_LIM_KEEP;
slr->vs_openfd.min = VC_LIM_KEEP;
+ slr->personality = 0;
+
cwd = open(".", O_RDONLY);
if (cwd == -1) {
perror("cannot get a handle on .");
fb = fopen(r->name, "r");
if (fb == NULL)
continue;
- if (fgets(buf, sizeof(buf), fb) != NULL && isdigit(*buf))
- *r->limit = atoi(buf);
+ if (fgets(buf, sizeof(buf), fb) != NULL) {
+ len=strlen(buf);
+ /* remove trailing newline */
+ if (buf[len-1] == '\n') {
+ buf[len-1]='\0';
+ len --;
+ }
+ if ( (r->type == TYPE_LONG) && isdigit(*buf)) {
+ *r->limit = atoi(buf);
+ } else if ( (r->type == TYPE_PERS) && isalpha(*buf)) {
+ unsigned long int res;
+ res = vc_str2personalitytype(buf,len);
+ if (res != VC_BAD_PERSONALITY) {
+ *r->personality = res;
+ }
+ }
+ }
+
fclose(fb);
}
if (vcr->hard < vcr->min)
break;
case 0:
- lim->rlim_cur = vcr->hard;
+ lim->rlim_max = vcr->hard;
adjusted = 1;
}
}
setrlimit(resource, &lim);
}
-void
+static inline int /* returns 0 on success or when nothing was requested, -1 when personality() fails */
+set_personality(unsigned long int personality_arg) /* personality_arg: value handed to personality(); 0 means "leave unchanged" */
+{
+ if (personality_arg == 0) /* 0 is treated as "no personality configured": skip the call entirely */
+ return 0;
+ if (personality(personality_arg) < 0) { /* a negative return from personality() is reported as failure */
+ return -1;
+ }
+ return 0;
+}
+
+int /* now returns a status: 0 on success (or when slr is NULL), otherwise the result of set_personality() */
pl_set_ulimits(const struct sliver_resources *slr)
{
if (!slr)
- return;
+ return 0; /* no resource description supplied: nothing to apply, reported as success */
set_one_ulimit(RLIMIT_RSS, &slr->vs_rss);
set_one_ulimit(RLIMIT_AS, &slr->vs_as);
set_one_ulimit(RLIMIT_NPROC, &slr->vs_nproc);
set_one_ulimit(RLIMIT_NOFILE, &slr->vs_openfd);
+ return set_personality(slr->personality); /* only the personality step contributes to the return value; the set_one_ulimit() calls above are not checked here */
}