bsd/kern/sysv_sem.c

   1 /*
   2  * Copyright (c) 2000-2019 Apple Inc. All rights reserved.
   3  *
   4  * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
   5  *
   6  * This file contains Original Code and/or Modifications of Original Code
   7  * as defined in and that are subject to the Apple Public Source License
   8  * Version 2.0 (the 'License'). You may not use this file except in
   9  * compliance with the License. The rights granted to you under the License
  10  * may not be used to create, or enable the creation or redistribution of,
  11  * unlawful or unlicensed copies of an Apple operating system, or to
  12  * circumvent, violate, or enable the circumvention or violation of, any
  13  * terms of an Apple operating system software license agreement.
  14  *
  15  * Please obtain a copy of the License at
  16  * http://www.opensource.apple.com/apsl/ and read it before using this file.
  17  *
  18  * The Original Code and all software distributed under the License are
  19  * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
  20  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
  21  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
  22  * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
  23  * Please see the License for the specific language governing rights and
  24  * limitations under the License.
  25  *
  26  * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
  27  */
  28 /*
  29  * Implementation of SVID semaphores
  30  *
  31  * Author:  Daniel Boulet
  32  *
  33  * This software is provided ``AS IS'' without any warranties of any kind.
  34  */
  35 /*
  36  * John Bellardo modified the implementation for Darwin. 12/2000
  37  */
  38 /*
  39  * NOTICE: This file was modified by McAfee Research in 2004 to introduce
  40  * support for mandatory and extensible security protections.  This notice
  41  * is included in support of clause 2.2 (b) of the Apple Public License,
  42  * Version 2.0.
  43  * Copyright (c) 2005-2006 SPARTA, Inc.
  44  */
  45
  46 #include <sys/param.h>
  47 #include <sys/systm.h>
  48 #include <sys/kernel.h>
  49 #include <sys/proc_internal.h>
  50 #include <sys/kauth.h>
  51 #include <sys/sem_internal.h>
  52 #include <sys/malloc.h>
  53 #include <mach/mach_types.h>
  54
  55 #include <sys/filedesc.h>
  56 #include <sys/file_internal.h>
  57 #include <sys/sysctl.h>
  58 #include <sys/ipcs.h>
  59 #include <sys/sysent.h>
  60 #include <sys/sysproto.h>
  61 #if CONFIG_MACF
  62 #include <security/mac_framework.h>
  63 #endif
  64
  65 #include <security/audit/audit.h>
  66
  67 #if SYSV_SEM
  68
  69
  70 /* Uncomment this line to see the debugging output */
  71 /* #define SEM_DEBUG */
  72
  73 /* Uncomment this line to see MAC debugging output. */
  74 /* #define      MAC_DEBUG */
  75 #if CONFIG_MACF_DEBUG
  76 #define MPRINTF(a)      printf(a)
  77 #else
  78 #define MPRINTF(a)
  79 #endif
  80
  81 #define M_SYSVSEM       M_TEMP
  82
  83
  84 /* Hard system limits to avoid resource starvation / DOS attacks.
  85  * These are not needed if we can make the semaphore pages swappable.
  86  */
  87 static struct seminfo limitseminfo = {
  88         .semmap = SEMMAP,        /* # of entries in semaphore map */
  89         .semmni = SEMMNI,        /* # of semaphore identifiers */
  90         .semmns = SEMMNS,        /* # of semaphores in system */
  91         .semmnu = SEMMNU,        /* # of undo structures in system */
  92         .semmsl = SEMMSL,        /* max # of semaphores per id */
  93         .semopm = SEMOPM,        /* max # of operations per semop call */
  94         .semume = SEMUME,        /* max # of undo entries per process */
  95         .semusz = SEMUSZ,        /* size in bytes of undo structure */
  96         .semvmx = SEMVMX,        /* semaphore maximum value */
  97         .semaem = SEMAEM         /* adjust on exit max value */
  98 };
  99
 100 /* Current system allocations.  We use this structure to track how many
 101  * resources we have allocated so far.  This way we can set large hard limits
 102  * and not allocate the memory for them up front.
 103  */
 104 struct seminfo seminfo = {
 105         .semmap = SEMMAP,       /* Unused, # of entries in semaphore map */
 106         .semmni = 0,            /* # of semaphore identifiers */
 107         .semmns = 0,            /* # of semaphores in system */
 108         .semmnu = 0,            /* # of undo entries in system */
 109         .semmsl = SEMMSL,       /* max # of semaphores per id */
 110         .semopm = SEMOPM,       /* max # of operations per semop call */
 111         .semume = SEMUME,       /* max # of undo entries per process */
 112         .semusz = SEMUSZ,       /* size in bytes of undo structure */
 113         .semvmx = SEMVMX,       /* semaphore maximum value */
 114         .semaem = SEMAEM        /* adjust on exit max value */
 115 };
 116
 117
 118 static int semu_alloc(struct proc *p);
 119 static int semundo_adjust(struct proc *p, int *supidx,
 120     int semid, int semnum, int adjval);
 121 static void semundo_clear(int semid, int semnum);
 122
 123 /* XXX casting to (sy_call_t *) is bogus, as usual. */
 124 static sy_call_t* const semcalls[] = {
 125         (sy_call_t *)semctl, (sy_call_t *)semget,
 126         (sy_call_t *)semop
 127 };
 128
 129 static int              semtot = 0;             /* # of used semaphores */
 130 struct semid_kernel     *sema = NULL;           /* semaphore id pool */
 131 struct sem              *sem_pool =  NULL;      /* semaphore pool */
 132 static int              semu_list_idx = -1;     /* active undo structures */
 133 struct sem_undo         *semu = NULL;           /* semaphore undo pool */
 134
 135
 136 void sysv_sem_lock_init(void);
 137 static lck_grp_t       *sysv_sem_subsys_lck_grp;
 138 static lck_grp_attr_t  *sysv_sem_subsys_lck_grp_attr;
 139 static lck_attr_t      *sysv_sem_subsys_lck_attr;
 140 static lck_mtx_t        sysv_sem_subsys_mutex;
 141
 142 #define SYSV_SEM_SUBSYS_LOCK() lck_mtx_lock(&sysv_sem_subsys_mutex)
 143 #define SYSV_SEM_SUBSYS_UNLOCK() lck_mtx_unlock(&sysv_sem_subsys_mutex)
 144
 145
 146 __private_extern__ void
 147 sysv_sem_lock_init( void )
 148 {
 149         sysv_sem_subsys_lck_grp_attr = lck_grp_attr_alloc_init();
 150
 151         sysv_sem_subsys_lck_grp = lck_grp_alloc_init("sysv_sem_subsys_lock", sysv_sem_subsys_lck_grp_attr);
 152
 153         sysv_sem_subsys_lck_attr = lck_attr_alloc_init();
 154         lck_mtx_init(&sysv_sem_subsys_mutex, sysv_sem_subsys_lck_grp, sysv_sem_subsys_lck_attr);
 155 }
 156
 157 static __inline__ user_time_t
 158 sysv_semtime(void)
 159 {
 160         struct timeval  tv;
 161         microtime(&tv);
 162         return tv.tv_sec;
 163 }
 164
 165 /*
 166  * XXX conversion of internal user_time_t to external tume_t loses
 167  * XXX precision; not an issue for us now, since we are only ever
 168  * XXX setting 32 bits worth of time into it.
 169  *
 170  * pad field contents are not moved correspondingly; contents will be lost
 171  *
 172  * NOTE: Source and target may *NOT* overlap! (target is smaller)
 173  */
 174 static void
 175 semid_ds_kernelto32(struct user_semid_ds *in, struct user32_semid_ds *out)
 176 {
 177         out->sem_perm = in->sem_perm;
 178         out->sem_base = CAST_DOWN_EXPLICIT(__int32_t, in->sem_base);
 179         out->sem_nsems = in->sem_nsems;
 180         out->sem_otime = in->sem_otime;         /* XXX loses precision */
 181         out->sem_ctime = in->sem_ctime;         /* XXX loses precision */
 182 }
 183
 184 static void
 185 semid_ds_kernelto64(struct user_semid_ds *in, struct user64_semid_ds *out)
 186 {
 187         out->sem_perm = in->sem_perm;
 188         out->sem_base = CAST_DOWN_EXPLICIT(__int32_t, in->sem_base);
 189         out->sem_nsems = in->sem_nsems;
 190         out->sem_otime = in->sem_otime;         /* XXX loses precision */
 191         out->sem_ctime = in->sem_ctime;         /* XXX loses precision */
 192 }
 193
 194 /*
 195  * pad field contents are not moved correspondingly; contents will be lost
 196  *
 197  * NOTE: Source and target may are permitted to overlap! (source is smaller);
 198  * this works because we copy fields in order from the end of the struct to
 199  * the beginning.
 200  *
 201  * XXX use CAST_USER_ADDR_T() for lack of a CAST_USER_TIME_T(); net effect
 202  * XXX is the same.
 203  */
 204 static void
 205 semid_ds_32tokernel(struct user32_semid_ds *in, struct user_semid_ds *out)
 206 {
 207         out->sem_ctime = in->sem_ctime;
 208         out->sem_otime = in->sem_otime;
 209         out->sem_nsems = in->sem_nsems;
 210         out->sem_base = (void *)(uintptr_t)in->sem_base;
 211         out->sem_perm = in->sem_perm;
 212 }
 213
 214 static void
 215 semid_ds_64tokernel(struct user64_semid_ds *in, struct user_semid_ds *out)
 216 {
 217         out->sem_ctime = in->sem_ctime;
 218         out->sem_otime = in->sem_otime;
 219         out->sem_nsems = in->sem_nsems;
 220         out->sem_base = (void *)(uintptr_t)in->sem_base;
 221         out->sem_perm = in->sem_perm;
 222 }
 223
 224
 225 /*
 226  * semsys
 227  *
 228  * Entry point for all SEM calls: semctl, semget, semop
 229  *
 230  * Parameters:  p       Process requesting the call
 231  *              uap     User argument descriptor (see below)
 232  *              retval  Return value of the selected sem call
 233  *
 234  * Indirect parameters: uap->which      sem call to invoke (index in array of sem calls)
 235  *                      uap->a2         User argument descriptor
 236  *
 237  * Returns:     0       Success
 238  *              !0      Not success
 239  *
 240  * Implicit returns: retval     Return value of the selected sem call
 241  *
 242  * DEPRECATED:  This interface should not be used to call the other SEM
 243  *              functions (semctl, semget, semop). The correct usage is
 244  *              to call the other SEM functions directly.
 245  *
 246  */
 247 int
 248 semsys(struct proc *p, struct semsys_args *uap, int32_t *retval)
 249 {
 250         /* The individual calls handling the locking now */
 251
 252         if (uap->which >= sizeof(semcalls) / sizeof(semcalls[0])) {
 253                 return EINVAL;
 254         }
 255         return (*semcalls[uap->which])(p, &uap->a2, retval);
 256 }
 257
 258 /*
 259  * Expand the semu array to the given capacity.  If the expansion fails
 260  * return 0, otherwise return 1.
 261  *
 262  * Assumes we already have the subsystem lock.
 263  */
 264 static int
 265 grow_semu_array(int newSize)
 266 {
 267         int i;
 268         struct sem_undo *newSemu;
 269
 270         if (newSize <= seminfo.semmnu) {
 271                 return 1;
 272         }
 273         if (newSize > limitseminfo.semmnu) { /* enforce hard limit */
 274 #ifdef SEM_DEBUG
 275                 printf("undo structure hard limit of %d reached, requested %d\n",
 276                     limitseminfo.semmnu, newSize);
 277 #endif
 278                 return 0;
 279         }
 280         newSize = (newSize / SEMMNU_INC + 1) * SEMMNU_INC;
 281         newSize = newSize > limitseminfo.semmnu ? limitseminfo.semmnu : newSize;
 282
 283 #ifdef SEM_DEBUG
 284         printf("growing semu[] from %d to %d\n", seminfo.semmnu, newSize);
 285 #endif
 286         MALLOC(newSemu, struct sem_undo *, sizeof(struct sem_undo) * newSize,
 287             M_SYSVSEM, M_WAITOK | M_ZERO);
 288         if (NULL == newSemu) {
 289 #ifdef SEM_DEBUG
 290                 printf("allocation failed.  no changes made.\n");
 291 #endif
 292                 return 0;
 293         }
 294
 295         /* copy the old data to the new array */
 296         for (i = 0; i < seminfo.semmnu; i++) {
 297                 newSemu[i] = semu[i];
 298         }
 299         /*
 300          * The new elements (from newSemu[i] to newSemu[newSize-1]) have their
 301          * "un_proc" set to 0 (i.e. NULL) by the M_ZERO flag to MALLOC() above,
 302          * so they're already marked as "not in use".
 303          */
 304
 305         /* Clean up the old array */
 306         if (semu) {
 307                 FREE(semu, M_SYSVSEM);
 308         }
 309
 310         semu = newSemu;
 311         seminfo.semmnu = newSize;
 312 #ifdef SEM_DEBUG
 313         printf("expansion successful\n");
 314 #endif
 315         return 1;
 316 }
 317
 318 /*
 319  * Expand the sema array to the given capacity.  If the expansion fails
 320  * we return 0, otherwise we return 1.
 321  *
 322  * Assumes we already have the subsystem lock.
 323  */
 324 static int
 325 grow_sema_array(int newSize)
 326 {
 327         struct semid_kernel *newSema;
 328         int i;
 329
 330         if (newSize <= seminfo.semmni) {
 331                 return 0;
 332         }
 333         if (newSize > limitseminfo.semmni) { /* enforce hard limit */
 334 #ifdef SEM_DEBUG
 335                 printf("identifier hard limit of %d reached, requested %d\n",
 336                     limitseminfo.semmni, newSize);
 337 #endif
 338                 return 0;
 339         }
 340         newSize = (newSize / SEMMNI_INC + 1) * SEMMNI_INC;
 341         newSize = newSize > limitseminfo.semmni ? limitseminfo.semmni : newSize;
 342
 343 #ifdef SEM_DEBUG
 344         printf("growing sema[] from %d to %d\n", seminfo.semmni, newSize);
 345 #endif
 346         MALLOC(newSema, struct semid_kernel *,
 347             sizeof(struct semid_kernel) * newSize,
 348             M_SYSVSEM, M_WAITOK | M_ZERO);
 349         if (NULL == newSema) {
 350 #ifdef SEM_DEBUG
 351                 printf("allocation failed.  no changes made.\n");
 352 #endif
 353                 return 0;
 354         }
 355
 356         /* copy over the old ids */
 357         for (i = 0; i < seminfo.semmni; i++) {
 358                 newSema[i] = sema[i];
 359                 /* This is a hack.  What we really want to be able to
 360                  * do is change the value a process is waiting on
 361                  * without waking it up, but I don't know how to do
 362                  * this with the existing code, so we wake up the
 363                  * process and let it do a lot of work to determine the
 364                  * semaphore set is really not available yet, and then
 365                  * sleep on the correct, reallocated semid_kernel pointer.
 366                  */
 367                 if (sema[i].u.sem_perm.mode & SEM_ALLOC) {
 368                         wakeup((caddr_t)&sema[i]);
 369                 }
 370         }
 371
 372 #if CONFIG_MACF
 373         for (i = seminfo.semmni; i < newSize; i++) {
 374                 mac_sysvsem_label_init(&newSema[i]);
 375         }
 376 #endif
 377
 378         /*
 379          * The new elements (from newSema[i] to newSema[newSize-1]) have their
 380          * "sem_base" and "sem_perm.mode" set to 0 (i.e. NULL) by the M_ZERO
 381          * flag to MALLOC() above, so they're already marked as "not in use".
 382          */
 383
 384         /* Clean up the old array */
 385         if (sema) {
 386                 FREE(sema, M_SYSVSEM);
 387         }
 388
 389         sema = newSema;
 390         seminfo.semmni = newSize;
 391 #ifdef SEM_DEBUG
 392         printf("expansion successful\n");
 393 #endif
 394         return 1;
 395 }
 396
 397 /*
 398  * Expand the sem_pool array to the given capacity.  If the expansion fails
 399  * we return 0 (fail), otherwise we return 1 (success).
 400  *
 401  * Assumes we already hold the subsystem lock.
 402  */
 403 static int
 404 grow_sem_pool(int new_pool_size)
 405 {
 406         struct sem *new_sem_pool = NULL;
 407         struct sem *sem_free;
 408         int i;
 409
 410         if (new_pool_size < semtot) {
 411                 return 0;
 412         }
 413         /* enforce hard limit */
 414         if (new_pool_size > limitseminfo.semmns) {
 415 #ifdef SEM_DEBUG
 416                 printf("semaphore hard limit of %d reached, requested %d\n",
 417                     limitseminfo.semmns, new_pool_size);
 418 #endif
 419                 return 0;
 420         }
 421
 422         new_pool_size = (new_pool_size / SEMMNS_INC + 1) * SEMMNS_INC;
 423         new_pool_size = new_pool_size > limitseminfo.semmns ? limitseminfo.semmns : new_pool_size;
 424
 425 #ifdef SEM_DEBUG
 426         printf("growing sem_pool array from %d to %d\n", seminfo.semmns, new_pool_size);
 427 #endif
 428         MALLOC(new_sem_pool, struct sem *, sizeof(struct sem) * new_pool_size,
 429             M_SYSVSEM, M_WAITOK | M_ZERO | M_NULL);
 430         if (NULL == new_sem_pool) {
 431 #ifdef SEM_DEBUG
 432                 printf("allocation failed.  no changes made.\n");
 433 #endif
 434                 return 0;
 435         }
 436
 437         /* We have our new memory, now copy the old contents over */
 438         if (sem_pool) {
 439                 for (i = 0; i < seminfo.semmns; i++) {
 440                         new_sem_pool[i] = sem_pool[i];
 441                 }
 442         }
 443
 444         /* Update our id structures to point to the new semaphores */
 445         for (i = 0; i < seminfo.semmni; i++) {
 446                 if (sema[i].u.sem_perm.mode & SEM_ALLOC) { /* ID in use */
 447                         sema[i].u.sem_base = new_sem_pool +
 448                             (sema[i].u.sem_base - sem_pool);
 449                 }
 450         }
 451
 452         sem_free = sem_pool;
 453         sem_pool = new_sem_pool;
 454
 455         /* clean up the old array */
 456         if (sem_free != NULL) {
 457                 FREE(sem_free, M_SYSVSEM);
 458         }
 459
 460         seminfo.semmns = new_pool_size;
 461 #ifdef SEM_DEBUG
 462         printf("expansion complete\n");
 463 #endif
 464         return 1;
 465 }
 466
 467 /*
 468  * Allocate a new sem_undo structure for a process
 469  * (returns ptr to structure or NULL if no more room)
 470  *
 471  * Assumes we already hold the subsystem lock.
 472  */
 473
 474 static int
 475 semu_alloc(struct proc *p)
 476 {
 477         int i;
 478         struct sem_undo *suptr;
 479         int *supidx;
 480         int attempt;
 481
 482         /*
 483          * Try twice to allocate something.
 484          * (we'll purge any empty structures after the first pass so
 485          * two passes are always enough)
 486          */
 487
 488         for (attempt = 0; attempt < 2; attempt++) {
 489                 /*
 490                  * Look for a free structure.
 491                  * Fill it in and return it if we find one.
 492                  */
 493
 494                 for (i = 0; i < seminfo.semmnu; i++) {
 495                         suptr = SEMU(i);
 496                         if (suptr->un_proc == NULL) {
 497                                 suptr->un_next_idx = semu_list_idx;
 498                                 semu_list_idx = i;
 499                                 suptr->un_cnt = 0;
 500                                 suptr->un_ent = NULL;
 501                                 suptr->un_proc = p;
 502                                 return i;
 503                         }
 504                 }
 505
 506                 /*
 507                  * We didn't find a free one, if this is the first attempt
 508                  * then try to free some structures.
 509                  */
 510
 511                 if (attempt == 0) {
 512                         /* All the structures are in use - try to free some */
 513                         int did_something = 0;
 514
 515                         supidx = &semu_list_idx;
 516                         while (*supidx != -1) {
 517                                 suptr = SEMU(*supidx);
 518                                 if (suptr->un_cnt == 0) {
 519                                         suptr->un_proc = NULL;
 520                                         *supidx = suptr->un_next_idx;
 521                                         did_something = 1;
 522                                 } else {
 523                                         supidx = &(suptr->un_next_idx);
 524                                 }
 525                         }
 526
 527                         /* If we didn't free anything. Try expanding
 528                          * the semu[] array.  If that doesn't work
 529                          * then fail.  We expand last to get the
 530                          * most reuse out of existing resources.
 531                          */
 532                         if (!did_something) {
 533                                 if (!grow_semu_array(seminfo.semmnu + 1)) {
 534                                         return -1;
 535                                 }
 536                         }
 537                 } else {
 538                         /*
 539                          * The second pass failed even though we freed
 540                          * something after the first pass!
 541                          * This is IMPOSSIBLE!
 542                          */
 543                         panic("semu_alloc - second attempt failed");
 544                 }
 545         }
 546         return -1;
 547 }
 548
 549 /*
 550  * Adjust a particular entry for a particular proc
 551  *
 552  * Assumes we already hold the subsystem lock.
 553  */
 554 static int
 555 semundo_adjust(struct proc *p, int *supidx, int semid,
 556     int semnum, int adjval)
 557 {
 558         struct sem_undo *suptr;
 559         int suidx;
 560         struct undo *sueptr, **suepptr, *new_sueptr;
 561         int i;
 562
 563         /*
 564          * Look for and remember the sem_undo if the caller doesn't provide it
 565          */
 566
 567         suidx = *supidx;
 568         if (suidx == -1) {
 569                 for (suidx = semu_list_idx; suidx != -1;
 570                     suidx = suptr->un_next_idx) {
 571                         suptr = SEMU(suidx);
 572                         if (suptr->un_proc == p) {
 573                                 *supidx = suidx;
 574                                 break;
 575                         }
 576                 }
 577                 if (suidx == -1) {
 578                         if (adjval == 0) {
 579                                 return 0;
 580                         }
 581                         suidx = semu_alloc(p);
 582                         if (suidx == -1) {
 583                                 return ENOSPC;
 584                         }
 585                         *supidx = suidx;
 586                 }
 587         }
 588
 589         /*
 590          * Look for the requested entry and adjust it (delete if adjval becomes
 591          * 0).
 592          */
 593         suptr = SEMU(suidx);
 594         new_sueptr = NULL;
 595         for (i = 0, suepptr = &suptr->un_ent, sueptr = suptr->un_ent;
 596             i < suptr->un_cnt;
 597             i++, suepptr = &sueptr->une_next, sueptr = sueptr->une_next) {
 598                 if (sueptr->une_id != semid || sueptr->une_num != semnum) {
 599                         continue;
 600                 }
 601                 if (adjval == 0) {
 602                         sueptr->une_adjval = 0;
 603                 } else {
 604                         sueptr->une_adjval += adjval;
 605                 }
 606                 if (sueptr->une_adjval == 0) {
 607                         suptr->un_cnt--;
 608                         *suepptr = sueptr->une_next;
 609                         FREE(sueptr, M_SYSVSEM);
 610                         sueptr = NULL;
 611                 }
 612                 return 0;
 613         }
 614
 615         /* Didn't find the right entry - create it */
 616         if (adjval == 0) {
 617                 /* no adjustment: no need for a new entry */
 618                 return 0;
 619         }
 620
 621         if (suptr->un_cnt == limitseminfo.semume) {
 622                 /* reached the limit number of semaphore undo entries */
 623                 return EINVAL;
 624         }
 625
 626         /* allocate a new semaphore undo entry */
 627         MALLOC(new_sueptr, struct undo *, sizeof(struct undo),
 628             M_SYSVSEM, M_WAITOK);
 629         if (new_sueptr == NULL) {
 630                 return ENOMEM;
 631         }
 632
 633         /* fill in the new semaphore undo entry */
 634         new_sueptr->une_next = suptr->un_ent;
 635         suptr->un_ent = new_sueptr;
 636         suptr->un_cnt++;
 637         new_sueptr->une_adjval = adjval;
 638         new_sueptr->une_id = semid;
 639         new_sueptr->une_num = semnum;
 640
 641         return 0;
 642 }
 643
 644 /* Assumes we already hold the subsystem lock.
 645  */
 646 static void
 647 semundo_clear(int semid, int semnum)
 648 {
 649         struct sem_undo *suptr;
 650         int suidx;
 651
 652         for (suidx = semu_list_idx; suidx != -1; suidx = suptr->un_next_idx) {
 653                 struct undo *sueptr;
 654                 struct undo **suepptr;
 655                 int i = 0;
 656
 657                 suptr = SEMU(suidx);
 658                 sueptr = suptr->un_ent;
 659                 suepptr = &suptr->un_ent;
 660                 while (i < suptr->un_cnt) {
 661                         if (sueptr->une_id == semid) {
 662                                 if (semnum == -1 || sueptr->une_num == semnum) {
 663                                         suptr->un_cnt--;
 664                                         *suepptr = sueptr->une_next;
 665                                         FREE(sueptr, M_SYSVSEM);
 666                                         sueptr = *suepptr;
 667                                         continue;
 668                                 }
 669                                 if (semnum != -1) {
 670                                         break;
 671                                 }
 672                         }
 673                         i++;
 674                         suepptr = &sueptr->une_next;
 675                         sueptr = sueptr->une_next;
 676                 }
 677         }
 678 }
 679
 680 /*
 681  * Note that the user-mode half of this passes a union coerced to a
 682  * user_addr_t.  The union contains either an int or a pointer, and
 683  * so we have to coerce it back, variant on whether the calling
 684  * process is 64 bit or not.  The coercion works for the 'val' element
 685  * because the alignment is the same in user and kernel space.
 686  */
 687 int
 688 semctl(struct proc *p, struct semctl_args *uap, int32_t *retval)
 689 {
 690         int semid = uap->semid;
 691         int semnum = uap->semnum;
 692         int cmd = uap->cmd;
 693         user_semun_t user_arg = (user_semun_t)uap->arg;
 694         kauth_cred_t cred = kauth_cred_get();
 695         int i, rval, eval;
 696         struct user_semid_ds sbuf;
 697         struct semid_kernel *semakptr;
 698
 699
 700         AUDIT_ARG(svipc_cmd, cmd);
 701         AUDIT_ARG(svipc_id, semid);
 702
 703         SYSV_SEM_SUBSYS_LOCK();
 704
 705 #ifdef SEM_DEBUG
 706         printf("call to semctl(%d, %d, %d, 0x%qx)\n", semid, semnum, cmd, user_arg);
 707 #endif
 708
 709         semid = IPCID_TO_IX(semid);
 710
 711         if (semid < 0 || semid >= seminfo.semmni) {
 712 #ifdef SEM_DEBUG
 713                 printf("Invalid semid\n");
 714 #endif
 715                 eval = EINVAL;
 716                 goto semctlout;
 717         }
 718
 719         semakptr = &sema[semid];
 720         if ((semakptr->u.sem_perm.mode & SEM_ALLOC) == 0 ||
 721             semakptr->u.sem_perm._seq != IPCID_TO_SEQ(uap->semid)) {
 722                 eval = EINVAL;
 723                 goto semctlout;
 724         }
 725 #if CONFIG_MACF
 726         eval = mac_sysvsem_check_semctl(cred, semakptr, cmd);
 727         if (eval) {
 728                 goto semctlout;
 729         }
 730 #endif
 731
 732         eval = 0;
 733         rval = 0;
 734
 735         switch (cmd) {
 736         case IPC_RMID:
 737                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_M))) {
 738                         goto semctlout;
 739                 }
 740
 741                 semakptr->u.sem_perm.cuid = kauth_cred_getuid(cred);
 742                 semakptr->u.sem_perm.uid = kauth_cred_getuid(cred);
 743                 semtot -= semakptr->u.sem_nsems;
 744                 for (i = semakptr->u.sem_base - sem_pool; i < semtot; i++) {
 745                         sem_pool[i] = sem_pool[i + semakptr->u.sem_nsems];
 746                 }
 747                 for (i = 0; i < seminfo.semmni; i++) {
 748                         if ((sema[i].u.sem_perm.mode & SEM_ALLOC) &&
 749                             sema[i].u.sem_base > semakptr->u.sem_base) {
 750                                 sema[i].u.sem_base -= semakptr->u.sem_nsems;
 751                         }
 752                 }
 753                 semakptr->u.sem_perm.mode = 0;
 754 #if CONFIG_MACF
 755                 mac_sysvsem_label_recycle(semakptr);
 756 #endif
 757                 semundo_clear(semid, -1);
 758                 wakeup((caddr_t)semakptr);
 759                 break;
 760
 761         case IPC_SET:
 762                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_M))) {
 763                         goto semctlout;
 764                 }
 765
 766                 if (IS_64BIT_PROCESS(p)) {
 767                         struct user64_semid_ds ds64;
 768                         eval = copyin(user_arg.buf, &ds64, sizeof(ds64));
 769                         semid_ds_64tokernel(&ds64, &sbuf);
 770                 } else {
 771                         struct user32_semid_ds ds32;
 772                         eval = copyin(user_arg.buf, &ds32, sizeof(ds32));
 773                         semid_ds_32tokernel(&ds32, &sbuf);
 774                 }
 775
 776                 if (eval != 0) {
 777                         goto semctlout;
 778                 }
 779
 780                 semakptr->u.sem_perm.uid = sbuf.sem_perm.uid;
 781                 semakptr->u.sem_perm.gid = sbuf.sem_perm.gid;
 782                 semakptr->u.sem_perm.mode = (semakptr->u.sem_perm.mode &
 783                     ~0777) | (sbuf.sem_perm.mode & 0777);
 784                 semakptr->u.sem_ctime = sysv_semtime();
 785                 break;
 786
 787         case IPC_STAT:
 788                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_R))) {
 789                         goto semctlout;
 790                 }
 791
 792                 if (IS_64BIT_PROCESS(p)) {
 793                         struct user64_semid_ds semid_ds64;
 794                         bzero(&semid_ds64, sizeof(semid_ds64));
 795                         semid_ds_kernelto64(&semakptr->u, &semid_ds64);
 796                         eval = copyout(&semid_ds64, user_arg.buf, sizeof(semid_ds64));
 797                 } else {
 798                         struct user32_semid_ds semid_ds32;
 799                         bzero(&semid_ds32, sizeof(semid_ds32));
 800                         semid_ds_kernelto32(&semakptr->u, &semid_ds32);
 801                         eval = copyout(&semid_ds32, user_arg.buf, sizeof(semid_ds32));
 802                 }
 803                 break;
 804
 805         case GETNCNT:
 806                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_R))) {
 807                         goto semctlout;
 808                 }
 809                 if (semnum < 0 || semnum >= semakptr->u.sem_nsems) {
 810                         eval = EINVAL;
 811                         goto semctlout;
 812                 }
 813                 rval = semakptr->u.sem_base[semnum].semncnt;
 814                 break;
 815
 816         case GETPID:
 817                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_R))) {
 818                         goto semctlout;
 819                 }
 820                 if (semnum < 0 || semnum >= semakptr->u.sem_nsems) {
 821                         eval = EINVAL;
 822                         goto semctlout;
 823                 }
 824                 rval = semakptr->u.sem_base[semnum].sempid;
 825                 break;
 826
 827         case GETVAL:
 828                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_R))) {
 829                         goto semctlout;
 830                 }
 831                 if (semnum < 0 || semnum >= semakptr->u.sem_nsems) {
 832                         eval = EINVAL;
 833                         goto semctlout;
 834                 }
 835                 rval = semakptr->u.sem_base[semnum].semval;
 836                 break;
 837
 838         case GETALL:
 839                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_R))) {
 840                         goto semctlout;
 841                 }
 842 /* XXXXXXXXXXXXXXXX TBD XXXXXXXXXXXXXXXX */
 843                 for (i = 0; i < semakptr->u.sem_nsems; i++) {
 844                         /* XXX could be done in one go... */
 845                         eval = copyout((caddr_t)&semakptr->u.sem_base[i].semval,
 846                             user_arg.array + (i * sizeof(unsigned short)),
 847                             sizeof(unsigned short));
 848                         if (eval != 0) {
 849                                 break;
 850                         }
 851                 }
 852                 break;
 853
 854         case GETZCNT:
 855                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_R))) {
 856                         goto semctlout;
 857                 }
 858                 if (semnum < 0 || semnum >= semakptr->u.sem_nsems) {
 859                         eval = EINVAL;
 860                         goto semctlout;
 861                 }
 862                 rval = semakptr->u.sem_base[semnum].semzcnt;
 863                 break;
 864
 865         case SETVAL:
 866                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_W))) {
 867 #ifdef SEM_DEBUG
 868                         printf("Invalid credentials for write\n");
 869 #endif
 870                         goto semctlout;
 871                 }
 872                 if (semnum < 0 || semnum >= semakptr->u.sem_nsems) {
 873 #ifdef SEM_DEBUG
 874                         printf("Invalid number out of range for set\n");
 875 #endif
 876                         eval = EINVAL;
 877                         goto semctlout;
 878                 }
 879
 880                 /*
 881                  * Cast down a pointer instead of using 'val' member directly
 882                  * to avoid introducing endieness and a pad field into the
 883                  * header file.  Ugly, but it works.
 884                  */
 885                 u_int newsemval = CAST_DOWN_EXPLICIT(u_int, user_arg.buf);
 886
 887                 /*
 888                  * The check is being performed as unsigned values to match
 889                  * eventual destination
 890                  */
 891                 if (newsemval > (u_int)seminfo.semvmx) {
 892 #ifdef SEM_DEBUG
 893                         printf("Out of range sem value for set\n");
 894 #endif
 895                         eval = ERANGE;
 896                         goto semctlout;
 897                 }
 898                 semakptr->u.sem_base[semnum].semval = newsemval;
 899                 semakptr->u.sem_base[semnum].sempid = p->p_pid;
 900                 /* XXX scottl Should there be a MAC call here? */
 901                 semundo_clear(semid, semnum);
 902                 wakeup((caddr_t)semakptr);
 903                 break;
 904
 905         case SETALL:
 906                 if ((eval = ipcperm(cred, &semakptr->u.sem_perm, IPC_W))) {
 907                         goto semctlout;
 908                 }
 909 /*** XXXXXXXXXXXX TBD ********/
 910                 for (i = 0; i < semakptr->u.sem_nsems; i++) {
 911                         /* XXX could be done in one go... */
 912                         eval = copyin(user_arg.array + (i * sizeof(unsigned short)),
 913                             (caddr_t)&semakptr->u.sem_base[i].semval,
 914                             sizeof(unsigned short));
 915                         if (eval != 0) {
 916                                 break;
 917                         }
 918                         semakptr->u.sem_base[i].sempid = p->p_pid;
 919                 }
 920                 /* XXX scottl Should there be a MAC call here? */
 921                 semundo_clear(semid, -1);
 922                 wakeup((caddr_t)semakptr);
 923                 break;
 924
 925         default:
 926                 eval = EINVAL;
 927                 goto semctlout;
 928         }
 929
 930         if (eval == 0) {
 931                 *retval = rval;
 932         }
 933 semctlout:
 934         SYSV_SEM_SUBSYS_UNLOCK();
 935         return eval;
 936 }
 937
 938 int
 939 semget(__unused struct proc *p, struct semget_args *uap, int32_t *retval)
 940 {
 941         int semid, eval;
 942         int key = uap->key;
 943         int nsems = uap->nsems;
 944         int semflg = uap->semflg;
 945         kauth_cred_t cred = kauth_cred_get();
 946
 947 #ifdef SEM_DEBUG
 948         if (key != IPC_PRIVATE) {
 949                 printf("semget(0x%x, %d, 0%o)\n", key, nsems, semflg);
 950         } else {
 951                 printf("semget(IPC_PRIVATE, %d, 0%o)\n", nsems, semflg);
 952         }
 953 #endif
 954
 955
 956         SYSV_SEM_SUBSYS_LOCK();
 957
 958
 959         if (key != IPC_PRIVATE) {
 960                 for (semid = 0; semid < seminfo.semmni; semid++) {
 961                         if ((sema[semid].u.sem_perm.mode & SEM_ALLOC) &&
 962                             sema[semid].u.sem_perm._key == key) {
 963                                 break;
 964                         }
 965                 }
 966                 if (semid < seminfo.semmni) {
 967 #ifdef SEM_DEBUG
 968                         printf("found public key\n");
 969 #endif
 970                         if ((eval = ipcperm(cred, &sema[semid].u.sem_perm,
 971                             semflg & 0700))) {
 972                                 goto semgetout;
 973                         }
 974                         if (nsems < 0 || sema[semid].u.sem_nsems < nsems) {
 975 #ifdef SEM_DEBUG
 976                                 printf("too small\n");
 977 #endif
 978                                 eval = EINVAL;
 979                                 goto semgetout;
 980                         }
 981                         if ((semflg & IPC_CREAT) && (semflg & IPC_EXCL)) {
 982 #ifdef SEM_DEBUG
 983                                 printf("not exclusive\n");
 984 #endif
 985                                 eval = EEXIST;
 986                                 goto semgetout;
 987                         }
 988 #if CONFIG_MACF
 989                         eval = mac_sysvsem_check_semget(cred, &sema[semid]);
 990                         if (eval) {
 991                                 goto semgetout;
 992                         }
 993 #endif
 994                         goto found;
 995                 }
 996         }
 997
 998 #ifdef SEM_DEBUG
 999         printf("need to allocate an id for the request\n");
1000 #endif
1001         if (key == IPC_PRIVATE || (semflg & IPC_CREAT)) {
1002                 if (nsems <= 0 || nsems > limitseminfo.semmsl) {
1003 #ifdef SEM_DEBUG
1004                         printf("nsems out of range (0<%d<=%d)\n", nsems,
1005                             seminfo.semmsl);
1006 #endif
1007                         eval = EINVAL;
1008                         goto semgetout;
1009                 }
1010                 if (nsems > seminfo.semmns - semtot) {
1011 #ifdef SEM_DEBUG
1012                         printf("not enough semaphores left (need %d, got %d)\n",
1013                             nsems, seminfo.semmns - semtot);
1014 #endif
1015                         if (!grow_sem_pool(semtot + nsems)) {
1016 #ifdef SEM_DEBUG
1017                                 printf("failed to grow the sem array\n");
1018 #endif
1019                                 eval = ENOSPC;
1020                                 goto semgetout;
1021                         }
1022                 }
1023                 for (semid = 0; semid < seminfo.semmni; semid++) {
1024                         if ((sema[semid].u.sem_perm.mode & SEM_ALLOC) == 0) {
1025                                 break;
1026                         }
1027                 }
1028                 if (semid == seminfo.semmni) {
1029 #ifdef SEM_DEBUG
1030                         printf("no more id's available\n");
1031 #endif
1032                         if (!grow_sema_array(seminfo.semmni + 1)) {
1033 #ifdef SEM_DEBUG
1034                                 printf("failed to grow sema array\n");
1035 #endif
1036                                 eval = ENOSPC;
1037                                 goto semgetout;
1038                         }
1039                 }
1040 #ifdef SEM_DEBUG
1041                 printf("semid %d is available\n", semid);
1042 #endif
1043                 sema[semid].u.sem_perm._key = key;
1044                 sema[semid].u.sem_perm.cuid = kauth_cred_getuid(cred);
1045                 sema[semid].u.sem_perm.uid = kauth_cred_getuid(cred);
1046                 sema[semid].u.sem_perm.cgid = kauth_cred_getgid(cred);
1047                 sema[semid].u.sem_perm.gid = kauth_cred_getgid(cred);
1048                 sema[semid].u.sem_perm.mode = (semflg & 0777) | SEM_ALLOC;
1049                 sema[semid].u.sem_perm._seq =
1050                     (sema[semid].u.sem_perm._seq + 1) & 0x7fff;
1051                 sema[semid].u.sem_nsems = nsems;
1052                 sema[semid].u.sem_otime = 0;
1053                 sema[semid].u.sem_ctime = sysv_semtime();
1054                 sema[semid].u.sem_base = &sem_pool[semtot];
1055                 semtot += nsems;
1056                 bzero(sema[semid].u.sem_base,
1057                     sizeof(sema[semid].u.sem_base[0]) * nsems);
1058 #if CONFIG_MACF
1059                 mac_sysvsem_label_associate(cred, &sema[semid]);
1060 #endif
1061 #ifdef SEM_DEBUG
1062                 printf("sembase = 0x%x, next = 0x%x\n", sema[semid].u.sem_base,
1063                     &sem_pool[semtot]);
1064 #endif
1065         } else {
1066 #ifdef SEM_DEBUG
1067                 printf("didn't find it and wasn't asked to create it\n");
1068 #endif
1069                 eval = ENOENT;
1070                 goto semgetout;
1071         }
1072
1073 found:
1074         *retval = IXSEQ_TO_IPCID(semid, sema[semid].u.sem_perm);
1075         AUDIT_ARG(svipc_id, *retval);
1076 #ifdef SEM_DEBUG
1077         printf("semget is done, returning %d\n", *retval);
1078 #endif
1079         eval = 0;
1080
1081 semgetout:
1082         SYSV_SEM_SUBSYS_UNLOCK();
1083         return eval;
1084 }
1085
1086 int
1087 semop(struct proc *p, struct semop_args *uap, int32_t *retval)
1088 {
1089         int semid = uap->semid;
1090         int nsops = uap->nsops;
1091         struct sembuf sops[seminfo.semopm];
1092         struct semid_kernel *semakptr;
1093         struct sembuf *sopptr = NULL;   /* protected by 'semptr' */
1094         struct sem *semptr = NULL;      /* protected by 'if' */
1095         int supidx = -1;
1096         int i, j, eval;
1097         int do_wakeup, do_undos;
1098
1099         AUDIT_ARG(svipc_id, uap->semid);
1100
1101         SYSV_SEM_SUBSYS_LOCK();
1102
1103 #ifdef SEM_DEBUG
1104         printf("call to semop(%d, 0x%x, %d)\n", semid, sops, nsops);
1105 #endif
1106
1107         semid = IPCID_TO_IX(semid);     /* Convert back to zero origin */
1108
1109         if (semid < 0 || semid >= seminfo.semmni) {
1110                 eval = EINVAL;
1111                 goto semopout;
1112         }
1113
1114         semakptr = &sema[semid];
1115         if ((semakptr->u.sem_perm.mode & SEM_ALLOC) == 0) {
1116                 eval = EINVAL;
1117                 goto semopout;
1118         }
1119         if (semakptr->u.sem_perm._seq != IPCID_TO_SEQ(uap->semid)) {
1120                 eval = EINVAL;
1121                 goto semopout;
1122         }
1123
1124         if ((eval = ipcperm(kauth_cred_get(), &semakptr->u.sem_perm, IPC_W))) {
1125 #ifdef SEM_DEBUG
1126                 printf("eval = %d from ipaccess\n", eval);
1127 #endif
1128                 goto semopout;
1129         }
1130
1131         if (nsops < 0 || nsops > seminfo.semopm) {
1132 #ifdef SEM_DEBUG
1133                 printf("too many sops (max=%d, nsops=%d)\n",
1134                     seminfo.semopm, nsops);
1135 #endif
1136                 eval = E2BIG;
1137                 goto semopout;
1138         }
1139
1140         /*  OK for LP64, since sizeof(struct sembuf) is currently invariant */
1141         if ((eval = copyin(uap->sops, &sops, nsops * sizeof(struct sembuf))) != 0) {
1142 #ifdef SEM_DEBUG
1143                 printf("eval = %d from copyin(%08x, %08x, %ld)\n", eval,
1144                     uap->sops, &sops, nsops * sizeof(struct sembuf));
1145 #endif
1146                 goto semopout;
1147         }
1148
1149 #if CONFIG_MACF
1150         /*
1151          * Initial pass thru sops to see what permissions are needed.
1152          */
1153         j = 0;          /* permission needed */
1154         for (i = 0; i < nsops; i++) {
1155                 j |= (sops[i].sem_op == 0) ? SEM_R : SEM_A;
1156         }
1157
1158         /*
1159          * The MAC hook checks whether the thread has read (and possibly
1160          * write) permissions to the semaphore array based on the
1161          * sopptr->sem_op value.
1162          */
1163         eval = mac_sysvsem_check_semop(kauth_cred_get(), semakptr, j);
1164         if (eval) {
1165                 goto semopout;
1166         }
1167 #endif
1168
1169         /*
1170          * Loop trying to satisfy the vector of requests.
1171          * If we reach a point where we must wait, any requests already
1172          * performed are rolled back and we go to sleep until some other
1173          * process wakes us up.  At this point, we start all over again.
1174          *
1175          * This ensures that from the perspective of other tasks, a set
1176          * of requests is atomic (never partially satisfied).
1177          */
1178         do_undos = 0;
1179
1180         for (;;) {
1181                 do_wakeup = 0;
1182
1183                 for (i = 0; i < nsops; i++) {
1184                         sopptr = &sops[i];
1185
1186                         if (sopptr->sem_num >= semakptr->u.sem_nsems) {
1187                                 eval = EFBIG;
1188                                 goto semopout;
1189                         }
1190
1191                         semptr = &semakptr->u.sem_base[sopptr->sem_num];
1192
1193 #ifdef SEM_DEBUG
1194                         printf("semop:  semakptr=%x, sem_base=%x, semptr=%x, sem[%d]=%d : op=%d, flag=%s\n",
1195                             semakptr, semakptr->u.sem_base, semptr,
1196                             sopptr->sem_num, semptr->semval, sopptr->sem_op,
1197                             (sopptr->sem_flg & IPC_NOWAIT) ? "nowait" : "wait");
1198 #endif
1199
1200                         if (sopptr->sem_op < 0) {
1201                                 if (semptr->semval + sopptr->sem_op < 0) {
1202 #ifdef SEM_DEBUG
1203                                         printf("semop:  can't do it now\n");
1204 #endif
1205                                         break;
1206                                 } else {
1207                                         semptr->semval += sopptr->sem_op;
1208                                         if (semptr->semval == 0 &&
1209                                             semptr->semzcnt > 0) {
1210                                                 do_wakeup = 1;
1211                                         }
1212                                 }
1213                                 if (sopptr->sem_flg & SEM_UNDO) {
1214                                         do_undos = 1;
1215                                 }
1216                         } else if (sopptr->sem_op == 0) {
1217                                 if (semptr->semval > 0) {
1218 #ifdef SEM_DEBUG
1219                                         printf("semop:  not zero now\n");
1220 #endif
1221                                         break;
1222                                 }
1223                         } else {
1224                                 if (semptr->semncnt > 0) {
1225                                         do_wakeup = 1;
1226                                 }
1227                                 semptr->semval += sopptr->sem_op;
1228                                 if (sopptr->sem_flg & SEM_UNDO) {
1229                                         do_undos = 1;
1230                                 }
1231                         }
1232                 }
1233
1234                 /*
1235                  * Did we get through the entire vector?
1236                  */
1237                 if (i >= nsops) {
1238                         goto done;
1239                 }
1240
1241                 /*
1242                  * No ... rollback anything that we've already done
1243                  */
1244 #ifdef SEM_DEBUG
1245                 printf("semop:  rollback 0 through %d\n", i - 1);
1246 #endif
1247                 for (j = 0; j < i; j++) {
1248                         semakptr->u.sem_base[sops[j].sem_num].semval -=
1249                             sops[j].sem_op;
1250                 }
1251
1252                 /*
1253                  * If the request that we couldn't satisfy has the
1254                  * NOWAIT flag set then return with EAGAIN.
1255                  */
1256                 if (sopptr->sem_flg & IPC_NOWAIT) {
1257                         eval = EAGAIN;
1258                         goto semopout;
1259                 }
1260
1261                 if (sopptr->sem_op == 0) {
1262                         semptr->semzcnt++;
1263                 } else {
1264                         semptr->semncnt++;
1265                 }
1266
1267 #ifdef SEM_DEBUG
1268                 printf("semop:  good night!\n");
1269 #endif
1270                 /* Release our lock on the semaphore subsystem so
1271                  * another thread can get at the semaphore we are
1272                  * waiting for. We will get the lock back after we
1273                  * wake up.
1274                  */
1275                 eval = msleep((caddr_t)semakptr, &sysv_sem_subsys_mutex, (PZERO - 4) | PCATCH,
1276                     "semwait", 0);
1277
1278 #ifdef SEM_DEBUG
1279                 printf("semop:  good morning (eval=%d)!\n", eval);
1280 #endif
1281                 if (eval != 0) {
1282                         eval = EINTR;
1283                 }
1284
1285                 /*
1286                  * IMPORTANT: while we were asleep, the semaphore array might
1287                  * have been reallocated somewhere else (see grow_sema_array()).
1288                  * When we wake up, we have to re-lookup the semaphore
1289                  * structures and re-validate them.
1290                  */
1291
1292                 semptr = NULL;
1293
1294                 /*
1295                  * Make sure that the semaphore still exists
1296                  *
1297                  * XXX POSIX: Third test this 'if' and 'EINTR' precedence may
1298                  * fail testing; if so, we will need to revert this code.
1299                  */
1300                 semakptr = &sema[semid];   /* sema may have been reallocated */
1301                 if ((semakptr->u.sem_perm.mode & SEM_ALLOC) == 0 ||
1302                     semakptr->u.sem_perm._seq != IPCID_TO_SEQ(uap->semid) ||
1303                     sopptr->sem_num >= semakptr->u.sem_nsems) {
1304                         /* The man page says to return EIDRM. */
1305                         /* Unfortunately, BSD doesn't define that code! */
1306                         if (eval == EINTR) {
1307                                 /*
1308                                  * EINTR takes precedence over the fact that
1309                                  * the semaphore disappeared while we were
1310                                  * sleeping...
1311                                  */
1312                         } else {
1313 #ifdef EIDRM
1314                                 eval = EIDRM;
1315 #else
1316                                 eval = EINVAL;          /* Ancient past */
1317 #endif
1318                         }
1319                         goto semopout;
1320                 }
1321
1322                 /*
1323                  * The semaphore is still alive.  Readjust the count of
1324                  * waiting processes. semptr needs to be recomputed
1325                  * because the sem[] may have been reallocated while
1326                  * we were sleeping, updating our sem_base pointer.
1327                  */
1328                 semptr = &semakptr->u.sem_base[sopptr->sem_num];
1329                 if (sopptr->sem_op == 0) {
1330                         semptr->semzcnt--;
1331                 } else {
1332                         semptr->semncnt--;
1333                 }
1334
1335                 if (eval != 0) { /* EINTR */
1336                         goto semopout;
1337                 }
1338         }
1339
1340 done:
1341         /*
1342          * Process any SEM_UNDO requests.
1343          */
1344         if (do_undos) {
1345                 for (i = 0; i < nsops; i++) {
1346                         /*
1347                          * We only need to deal with SEM_UNDO's for non-zero
1348                          * op's.
1349                          */
1350                         int adjval;
1351
1352                         if ((sops[i].sem_flg & SEM_UNDO) == 0) {
1353                                 continue;
1354                         }
1355                         adjval = sops[i].sem_op;
1356                         if (adjval == 0) {
1357                                 continue;
1358                         }
1359                         eval = semundo_adjust(p, &supidx, semid,
1360                             sops[i].sem_num, -adjval);
1361                         if (eval == 0) {
1362                                 continue;
1363                         }
1364
1365                         /*
1366                          * Oh-Oh!  We ran out of either sem_undo's or undo's.
1367                          * Rollback the adjustments to this point and then
1368                          * rollback the semaphore ups and down so we can return
1369                          * with an error with all structures restored.  We
1370                          * rollback the undo's in the exact reverse order that
1371                          * we applied them.  This guarantees that we won't run
1372                          * out of space as we roll things back out.
1373                          */
1374                         for (j = i - 1; j >= 0; j--) {
1375                                 if ((sops[j].sem_flg & SEM_UNDO) == 0) {
1376                                         continue;
1377                                 }
1378                                 adjval = sops[j].sem_op;
1379                                 if (adjval == 0) {
1380                                         continue;
1381                                 }
1382                                 if (semundo_adjust(p, &supidx, semid,
1383                                     sops[j].sem_num, adjval) != 0) {
1384                                         panic("semop - can't undo undos");
1385                                 }
1386                         }
1387
1388                         for (j = 0; j < nsops; j++) {
1389                                 semakptr->u.sem_base[sops[j].sem_num].semval -=
1390                                     sops[j].sem_op;
1391                         }
1392
1393 #ifdef SEM_DEBUG
1394                         printf("eval = %d from semundo_adjust\n", eval);
1395 #endif
1396                         goto semopout;
1397                 } /* loop through the sops */
1398         } /* if (do_undos) */
1399
1400         /* We're definitely done - set the sempid's */
1401         for (i = 0; i < nsops; i++) {
1402                 sopptr = &sops[i];
1403                 semptr = &semakptr->u.sem_base[sopptr->sem_num];
1404                 semptr->sempid = p->p_pid;
1405         }
1406         semakptr->u.sem_otime = sysv_semtime();
1407
1408         if (do_wakeup) {
1409 #ifdef SEM_DEBUG
1410                 printf("semop:  doing wakeup\n");
1411 #ifdef SEM_WAKEUP
1412                 sem_wakeup((caddr_t)semakptr);
1413 #else
1414                 wakeup((caddr_t)semakptr);
1415 #endif
1416                 printf("semop:  back from wakeup\n");
1417 #else
1418                 wakeup((caddr_t)semakptr);
1419 #endif
1420         }
1421 #ifdef SEM_DEBUG
1422         printf("semop:  done\n");
1423 #endif
1424         *retval = 0;
1425         eval = 0;
1426 semopout:
1427         SYSV_SEM_SUBSYS_UNLOCK();
1428         return eval;
1429 }
1430
1431 /*
1432  * Go through the undo structures for this process and apply the adjustments to
1433  * semaphores.
1434  */
1435 void
1436 semexit(struct proc *p)
1437 {
1438         struct sem_undo *suptr = NULL;
1439         int suidx;
1440         int *supidx;
1441         int did_something;
1442
1443         /* If we have not allocated our semaphores yet there can't be
1444          * anything to undo, but we need the lock to prevent
1445          * dynamic memory race conditions.
1446          */
1447         SYSV_SEM_SUBSYS_LOCK();
1448
1449         if (!sem_pool) {
1450                 SYSV_SEM_SUBSYS_UNLOCK();
1451                 return;
1452         }
1453         did_something = 0;
1454
1455         /*
1456          * Go through the chain of undo vectors looking for one
1457          * associated with this process.
1458          */
1459
1460         for (supidx = &semu_list_idx; (suidx = *supidx) != -1;
1461             supidx = &suptr->un_next_idx) {
1462                 suptr = SEMU(suidx);
1463                 if (suptr->un_proc == p) {
1464                         break;
1465                 }
1466         }
1467
1468         if (suidx == -1) {
1469                 goto unlock;
1470         }
1471
1472 #ifdef SEM_DEBUG
1473         printf("proc @%08x has undo structure with %d entries\n", p,
1474             suptr->un_cnt);
1475 #endif
1476
1477         /*
1478          * If there are any active undo elements then process them.
1479          */
1480         if (suptr->un_cnt > 0) {
1481                 while (suptr->un_ent != NULL) {
1482                         struct undo *sueptr;
1483                         int semid;
1484                         int semnum;
1485                         int adjval;
1486                         struct semid_kernel *semakptr;
1487
1488                         sueptr = suptr->un_ent;
1489                         semid = sueptr->une_id;
1490                         semnum = sueptr->une_num;
1491                         adjval = sueptr->une_adjval;
1492
1493                         semakptr = &sema[semid];
1494                         if ((semakptr->u.sem_perm.mode & SEM_ALLOC) == 0) {
1495                                 panic("semexit - semid not allocated");
1496                         }
1497                         if (semnum >= semakptr->u.sem_nsems) {
1498                                 panic("semexit - semnum out of range");
1499                         }
1500
1501 #ifdef SEM_DEBUG
1502                         printf("semexit:  %08x id=%d num=%d(adj=%d) ; sem=%d\n",
1503                             suptr->un_proc,
1504                             semid,
1505                             semnum,
1506                             adjval,
1507                             semakptr->u.sem_base[semnum].semval);
1508 #endif
1509
1510                         if (adjval < 0) {
1511                                 if (semakptr->u.sem_base[semnum].semval < -adjval) {
1512                                         semakptr->u.sem_base[semnum].semval = 0;
1513                                 } else {
1514                                         semakptr->u.sem_base[semnum].semval +=
1515                                             adjval;
1516                                 }
1517                         } else {
1518                                 semakptr->u.sem_base[semnum].semval += adjval;
1519                         }
1520
1521                         /* Maybe we should build a list of semakptr's to wake
1522                          * up, finish all access to data structures, release the
1523                          * subsystem lock, and wake all the processes.  Something
1524                          * to think about.
1525                          */
1526 #ifdef SEM_WAKEUP
1527                         sem_wakeup((caddr_t)semakptr);
1528 #else
1529                         wakeup((caddr_t)semakptr);
1530 #endif
1531 #ifdef SEM_DEBUG
1532                         printf("semexit:  back from wakeup\n");
1533 #endif
1534                         suptr->un_cnt--;
1535                         suptr->un_ent = sueptr->une_next;
1536                         FREE(sueptr, M_SYSVSEM);
1537                         sueptr = NULL;
1538                 }
1539         }
1540
1541         /*
1542          * Deallocate the undo vector.
1543          */
1544 #ifdef SEM_DEBUG
1545         printf("removing vector\n");
1546 #endif
1547         suptr->un_proc = NULL;
1548         *supidx = suptr->un_next_idx;
1549
1550 unlock:
1551         /*
1552          * There is a semaphore leak (i.e. memory leak) in this code.
1553          * We should be deleting the IPC_PRIVATE semaphores when they are
1554          * no longer needed, and we dont. We would have to track which processes
1555          * know about which IPC_PRIVATE semaphores, updating the list after
1556          * every fork.  We can't just delete them semaphore when the process
1557          * that created it dies, because that process may well have forked
1558          * some children.  So we need to wait until all of it's children have
1559          * died, and so on.  Maybe we should tag each IPC_PRIVATE sempahore
1560          * with the creating group ID, count the number of processes left in
1561          * that group, and delete the semaphore when the group is gone.
1562          * Until that code gets implemented we will leak IPC_PRIVATE semaphores.
1563          * There is an upper bound on the size of our semaphore array, so
1564          * leaking the semaphores should not work as a DOS attack.
1565          *
1566          * Please note that the original BSD code this file is based on had the
1567          * same leaky semaphore problem.
1568          */
1569
1570         SYSV_SEM_SUBSYS_UNLOCK();
1571 }
1572
1573
1574 /* (struct sysctl_oid *oidp, void *arg1, int arg2, \
1575  *       struct sysctl_req *req) */
1576 static int
1577 sysctl_seminfo(__unused struct sysctl_oid *oidp, void *arg1,
1578     __unused int arg2, struct sysctl_req *req)
1579 {
1580         int error = 0;
1581
1582         error = SYSCTL_OUT(req, arg1, sizeof(int));
1583         if (error || req->newptr == USER_ADDR_NULL) {
1584                 return error;
1585         }
1586
1587         SYSV_SEM_SUBSYS_LOCK();
1588
1589         /* Set the values only if shared memory is not initialised */
1590         if ((sem_pool == NULL) &&
1591             (sema == NULL) &&
1592             (semu == NULL) &&
1593             (semu_list_idx == -1)) {
1594                 if ((error = SYSCTL_IN(req, arg1, sizeof(int)))) {
1595                         goto out;
1596                 }
1597         } else {
1598                 error = EINVAL;
1599         }
1600 out:
1601         SYSV_SEM_SUBSYS_UNLOCK();
1602         return error;
1603 }
1604
1605 /* SYSCTL_NODE(_kern, KERN_SYSV, sysv, CTLFLAG_RW, 0, "SYSV"); */
1606 extern struct sysctl_oid_list sysctl__kern_sysv_children;
1607 SYSCTL_PROC(_kern_sysv, OID_AUTO, semmni, CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
1608     &limitseminfo.semmni, 0, &sysctl_seminfo, "I", "semmni");
1609
1610 SYSCTL_PROC(_kern_sysv, OID_AUTO, semmns, CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
1611     &limitseminfo.semmns, 0, &sysctl_seminfo, "I", "semmns");
1612
1613 SYSCTL_PROC(_kern_sysv, OID_AUTO, semmnu, CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
1614     &limitseminfo.semmnu, 0, &sysctl_seminfo, "I", "semmnu");
1615
1616 SYSCTL_PROC(_kern_sysv, OID_AUTO, semmsl, CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
1617     &limitseminfo.semmsl, 0, &sysctl_seminfo, "I", "semmsl");
1618
1619 SYSCTL_PROC(_kern_sysv, OID_AUTO, semume, CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
1620     &limitseminfo.semume, 0, &sysctl_seminfo, "I", "semume");
1621
1622
1623 static int
1624 IPCS_sem_sysctl(__unused struct sysctl_oid *oidp, __unused void *arg1,
1625     __unused int arg2, struct sysctl_req *req)
1626 {
1627         int error;
1628         int cursor;
1629         union {
1630                 struct user32_IPCS_command u32;
1631                 struct user_IPCS_command u64;
1632         } ipcs;
1633         struct user32_semid_ds semid_ds32;      /* post conversion, 32 bit version */
1634         struct user64_semid_ds semid_ds64;      /* post conversion, 64 bit version */
1635         void *semid_dsp;
1636         size_t ipcs_sz;
1637         size_t semid_ds_sz;
1638         struct proc *p = current_proc();
1639
1640         if (IS_64BIT_PROCESS(p)) {
1641                 ipcs_sz = sizeof(struct user_IPCS_command);
1642                 semid_ds_sz = sizeof(struct user64_semid_ds);
1643         } else {
1644                 ipcs_sz = sizeof(struct user32_IPCS_command);
1645                 semid_ds_sz = sizeof(struct user32_semid_ds);
1646         }
1647
1648         /* Copy in the command structure */
1649         if ((error = SYSCTL_IN(req, &ipcs, ipcs_sz)) != 0) {
1650                 return error;
1651         }
1652
1653         if (!IS_64BIT_PROCESS(p)) { /* convert in place */
1654                 ipcs.u64.ipcs_data = CAST_USER_ADDR_T(ipcs.u32.ipcs_data);
1655         }
1656
1657         /* Let us version this interface... */
1658         if (ipcs.u64.ipcs_magic != IPCS_MAGIC) {
1659                 return EINVAL;
1660         }
1661
1662         SYSV_SEM_SUBSYS_LOCK();
1663         switch (ipcs.u64.ipcs_op) {
1664         case IPCS_SEM_CONF:     /* Obtain global configuration data */
1665                 if (ipcs.u64.ipcs_datalen != sizeof(struct seminfo)) {
1666                         error = ERANGE;
1667                         break;
1668                 }
1669                 if (ipcs.u64.ipcs_cursor != 0) {        /* fwd. compat. */
1670                         error = EINVAL;
1671                         break;
1672                 }
1673                 error = copyout(&seminfo, ipcs.u64.ipcs_data, ipcs.u64.ipcs_datalen);
1674                 break;
1675
1676         case IPCS_SEM_ITER:     /* Iterate over existing segments */
1677                 cursor = ipcs.u64.ipcs_cursor;
1678                 if (cursor < 0 || cursor >= seminfo.semmni) {
1679                         error = ERANGE;
1680                         break;
1681                 }
1682                 if (ipcs.u64.ipcs_datalen != (int)semid_ds_sz) {
1683                         error = EINVAL;
1684                         break;
1685                 }
1686                 for (; cursor < seminfo.semmni; cursor++) {
1687                         if (sema[cursor].u.sem_perm.mode & SEM_ALLOC) {
1688                                 break;
1689                         }
1690                         continue;
1691                 }
1692                 if (cursor == seminfo.semmni) {
1693                         error = ENOENT;
1694                         break;
1695                 }
1696
1697                 semid_dsp = &sema[cursor].u;    /* default: 64 bit */
1698
1699                 /*
1700                  * If necessary, convert the 64 bit kernel segment
1701                  * descriptor to a 32 bit user one.
1702                  */
1703                 if (!IS_64BIT_PROCESS(p)) {
1704                         bzero(&semid_ds32, sizeof(semid_ds32));
1705                         semid_ds_kernelto32(semid_dsp, &semid_ds32);
1706                         semid_dsp = &semid_ds32;
1707                 } else {
1708                         bzero(&semid_ds64, sizeof(semid_ds64));
1709                         semid_ds_kernelto64(semid_dsp, &semid_ds64);
1710                         semid_dsp = &semid_ds64;
1711                 }
1712
1713                 error = copyout(semid_dsp, ipcs.u64.ipcs_data, ipcs.u64.ipcs_datalen);
1714                 if (!error) {
1715                         /* update cursor */
1716                         ipcs.u64.ipcs_cursor = cursor + 1;
1717
1718                         if (!IS_64BIT_PROCESS(p)) {     /* convert in place */
1719                                 ipcs.u32.ipcs_data = CAST_DOWN_EXPLICIT(user32_addr_t, ipcs.u64.ipcs_data);
1720                         }
1721
1722                         error = SYSCTL_OUT(req, &ipcs, ipcs_sz);
1723                 }
1724                 break;
1725
1726         default:
1727                 error = EINVAL;
1728                 break;
1729         }
1730         SYSV_SEM_SUBSYS_UNLOCK();
1731         return error;
1732 }
1733
1734 SYSCTL_DECL(_kern_sysv_ipcs);
1735 SYSCTL_PROC(_kern_sysv_ipcs, OID_AUTO, sem, CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
1736     0, 0, IPCS_sem_sysctl,
1737     "S,IPCS_sem_command",
1738     "ipcs sem command interface");
1739
1740 #endif /* SYSV_SEM */