@@ -832,6 +832,25 @@ void send_mountsources(int sockfd, pid_t child, char *mountsources, size_t mount
832
832
bail ("failed to close container mount namespace fd %d" , container_mntns_fd );
833
833
}
834
834
835
+ void try_unshare (int flags , const char * msg )
836
+ {
837
+ write_log (DEBUG , "unshare %s" , msg );
838
+ /*
839
+ * Kernels prior to v4.3 may return EINVAL on unshare when another process
840
+ * reads runc's /proc/$PID/status or /proc/$PID/maps. To work around this,
841
+ * retry on EINVAL a few times.
842
+ */
843
+ int retries = 5 ;
844
+ for (; retries > 0 ; retries -- ) {
845
+ if (unshare (flags ) == 0 ) {
846
+ return ;
847
+ }
848
+ if (errno != EINVAL )
849
+ break ;
850
+ }
851
+ bail ("failed to unshare %s" , msg );
852
+ }
853
+
835
854
void nsexec (void )
836
855
{
837
856
int pipenum ;
@@ -1170,9 +1189,7 @@ void nsexec(void)
1170
1189
* problem.
1171
1190
*/
1172
1191
if (config .cloneflags & CLONE_NEWUSER ) {
1173
- write_log (DEBUG , "unshare user namespace" );
1174
- if (unshare (CLONE_NEWUSER ) < 0 )
1175
- bail ("failed to unshare user namespace" );
1192
+ try_unshare (CLONE_NEWUSER , "user namespace" );
1176
1193
config .cloneflags &= ~CLONE_NEWUSER ;
1177
1194
1178
1195
/*
@@ -1224,9 +1241,7 @@ void nsexec(void)
1224
1241
* some old kernel versions where clone(CLONE_PARENT | CLONE_NEWPID)
1225
1242
* was broken, so we'll just do it the long way anyway.
1226
1243
*/
1227
- write_log (DEBUG , "unshare remaining namespace (except cgroupns)" );
1228
- if (unshare (config .cloneflags & ~CLONE_NEWCGROUP ) < 0 )
1229
- bail ("failed to unshare remaining namespaces (except cgroupns)" );
1244
+ try_unshare (config .cloneflags & ~CLONE_NEWCGROUP , "remaining namespaces (except cgroupns)" );
1230
1245
1231
1246
/* Ask our parent to send the mount sources fds. */
1232
1247
if (config .mountsources ) {
@@ -1344,8 +1359,7 @@ void nsexec(void)
1344
1359
}
1345
1360
1346
1361
if (config .cloneflags & CLONE_NEWCGROUP ) {
1347
- if (unshare (CLONE_NEWCGROUP ) < 0 )
1348
- bail ("failed to unshare cgroup namespace" );
1362
+ try_unshare (CLONE_NEWCGROUP , "cgroup namespace" );
1349
1363
}
1350
1364
1351
1365
write_log (DEBUG , "signal completion to stage-0" );
0 commit comments