// Copyright 2009 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

#ifdef HAVE_DL_ITERATE_PHDR

#ifdef USING_SPLIT_STACK

/* FIXME: These are not declared anywhere. */
extern void __splitstack_getcontext(void *context[10]);
extern void __splitstack_setcontext(void *context[10]);
extern void *__splitstack_makecontext(size_t, void *context[10], size_t *);
extern void *__splitstack_resetcontext(void *context[10], size_t *);
extern void *__splitstack_find(void *, void *, size_t *, void **, void **,
			       void **);
extern void __splitstack_block_signals (int *, int *);
extern void __splitstack_block_signals_context (void *context[10], int *,
						int *);

#ifndef PTHREAD_STACK_MIN
# define PTHREAD_STACK_MIN 8192
#endif

#if defined(USING_SPLIT_STACK) && defined(LINKER_SUPPORTS_SPLIT_STACK)
# define StackMin PTHREAD_STACK_MIN
#else
# define StackMin 2 * 1024 * 1024
#endif
uintptr runtime_stacks_sys;

static void schedule(G*);

static void gtraceback(G*);

typedef struct Sched Sched;

G	runtime_g0;	// idle goroutine for m0

#ifndef SETCONTEXT_CLOBBERS_TLS
fixcontext(ucontext_t *c __attribute__ ((unused)))

# if defined(__x86_64__) && defined(__sun__)

// x86_64 Solaris 10 and 11 have a bug: setcontext switches the %fs
// register to that of the thread which called getcontext. The effect
// is that the address of all __thread variables changes. This bug
// also affects pthread_self() and pthread_getspecific. We work
// around it by clobbering the context field directly to keep %fs the
// same.

static __thread greg_t fs;

	fs = c.uc_mcontext.gregs[REG_FSBASE];

fixcontext(ucontext_t* c)

	c->uc_mcontext.gregs[REG_FSBASE] = fs;
# elif defined(__NetBSD__)

// NetBSD has a bug: setcontext clobbers tlsbase, we need to save
// and restore it ourselves.

static __thread __greg_t tlsbase;

	tlsbase = c.uc_mcontext._mc_tlsbase;

fixcontext(ucontext_t* c)

	c->uc_mcontext._mc_tlsbase = tlsbase;

# error unknown case for SETCONTEXT_CLOBBERS_TLS
// We cannot always refer to the TLS variables directly. The
// compiler will call tls_get_addr to get the address of the variable,
// and it may hold it in a register across a call to schedule. When
// we get back from the call we may be running in a different thread,
// in which case the register now points to the TLS variable for a
// different thread. We use non-inlinable functions to avoid this
// problem.

G* runtime_g(void) __attribute__ ((noinline, no_split_stack));

M* runtime_m(void) __attribute__ ((noinline, no_split_stack));
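
// Illustrative sketch (not part of the runtime): the failure mode the
// comment above describes, and the pattern that avoids it. The example_
// name is hypothetical; runtime_m() is the real accessor.
static void example_use_m(void) __attribute__ ((unused));

static void
example_use_m(void)
{
	// WRONG (sketch only): caching m in a local across a call that can
	// reschedule, e.g. "M *mp = m; schedule(nil); mp->locks++;".  The
	// compiler may keep the TLS address of m in a register, and after
	// schedule() we may be on a different thread, so the cached address
	// would still point at the old thread's M.
	//
	// RIGHT: go back through the non-inlinable accessor after any call
	// that can move us to another thread, so the TLS address is
	// recomputed on the thread we are actually running on.
	runtime_m()->locks++;
	runtime_m()->locks--;
}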
int32	runtime_gcwaiting;

// The static TLS size. See runtime_newm.

#ifdef HAVE_DL_ITERATE_PHDR

// Called via dl_iterate_phdr.
addtls(struct dl_phdr_info* info, size_t size __attribute__ ((unused)), void *data)

	size_t *total = (size_t *)data;

	for(i = 0; i < info->dlpi_phnum; ++i) {
		if(info->dlpi_phdr[i].p_type == PT_TLS)
			*total += info->dlpi_phdr[i].p_memsz;

// Set the total TLS size.
	dl_iterate_phdr(addtls, (void *)&total);
// The go scheduler's job is to match ready-to-run goroutines (`g's)
// with waiting-for-work schedulers (`m's). If there are ready g's
// and no waiting m's, ready() will start a new m running in a new
// OS thread, so that all ready g's can run simultaneously, up to a limit.
// For now, m's never go away.
//
// By default, Go keeps only one kernel thread (m) running user code
// at a single time; other threads may be blocked in the operating system.
// Setting the environment variable $GOMAXPROCS or calling
// runtime.GOMAXPROCS() will change the number of user threads
// allowed to execute simultaneously. $GOMAXPROCS is thus an
// approximation of the maximum number of cores to use.
//
// Even a program that can run without deadlock in a single process
// might use more m's if given the chance. For example, the prime
// sieve will use as many m's as there are primes (up to runtime_sched.mmax),
// allowing different stages of the pipeline to execute in parallel.
// We could revisit this choice, only kicking off new m's for blocking
// system calls, but that would limit the amount of parallel computation
// that go would try to do.
//
// In general, one could imagine all sorts of refinements to the
// scheduler, but the goal now is just to get something working on
// Linux and OS X.
	G *gfree;	// available g's (status == Gdead)

	G *ghead;	// g's waiting to run
	int32 gwait;	// number of g's waiting to run
	int32 gcount;	// number of g's that are alive
	int32 grunning;	// number of g's running on cpu or in syscall

	M *mhead;	// m's waiting for work
	int32 mwait;	// number of m's waiting for work
	int32 mcount;	// number of m's that have been created

	volatile uint32 atomic;	// atomic scheduling word (see below)

	int32 profilehz;	// cpu profiling rate

	bool init;	// running initialization
	bool lockmain;	// init called runtime.LockOSThread

	Note stopped;	// one g can set waitstop and wait here for m's to stop
// The atomic word in sched is an atomic uint32 that
// holds these fields.
//
//	[15 bits] mcpu		number of m's executing on cpu
//	[15 bits] mcpumax	max number of m's allowed on cpu
//	[1 bit]   waitstop	some g is waiting on stopped
//	[1 bit]   gwaiting	gwait != 0
//
// These fields are the information needed by entersyscall
// and exitsyscall to decide whether to coordinate with the
// scheduler. Packing them into a single machine word lets
// them use a fast path with a single atomic read/write and
// no lock/unlock. This greatly reduces contention in
// syscall- or cgo-heavy multithreaded programs.
//
// Except for entersyscall and exitsyscall, the manipulations
// to these fields only happen while holding the schedlock,
// so the routines holding schedlock only need to worry about
// what entersyscall and exitsyscall do, not the other routines
// (which also use the schedlock).
//
// In particular, entersyscall and exitsyscall only read mcpumax,
// waitstop, and gwaiting. They never write them. Thus, writes to those
// fields can be done (holding schedlock) without fear of write conflicts.
// There may still be logic conflicts: for example, the set of waitstop must
// be conditioned on mcpu >= mcpumax or else the wait may be a
// spurious sleep. The Promela model in proc.p verifies these accesses.
	mcpuMask = (1<<mcpuWidth) - 1,
	mcpumaxShift = mcpuShift + mcpuWidth,
	waitstopShift = mcpumaxShift + mcpuWidth,
	gwaitingShift = waitstopShift+1,

	// The max value of GOMAXPROCS is constrained
	// by the max value we can store in the bit fields
	// of the atomic word. Reserve a few high values
	// so that we can detect accidental decrement
	// beyond zero.
	maxgomaxprocs = mcpuMask - 10,

#define atomic_mcpu(v)		(((v)>>mcpuShift)&mcpuMask)
#define atomic_mcpumax(v)	(((v)>>mcpumaxShift)&mcpuMask)
#define atomic_waitstop(v)	(((v)>>waitstopShift)&1)
#define atomic_gwaiting(v)	(((v)>>gwaitingShift)&1)
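
// Illustrative sketch (not part of the runtime): decoding a snapshot of
// the packed scheduling word with the macros above. Writers build a new
// word and CAS it in, the same shape setmcpumax uses below. The example_
// name is hypothetical.
static bool example_can_start_goroutine(uint32 v) __attribute__ ((unused));

static bool
example_can_start_goroutine(uint32 v)
{
	// v is a snapshot of the atomic word (runtime_sched.atomic).
	if(!atomic_gwaiting(v))
		return false;				// no g is queued to run
	return atomic_mcpu(v) < atomic_mcpumax(v);	// and a cpu slot is free
}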
int32 runtime_gomaxprocs;
bool runtime_singleproc;

static bool canaddmcpu(void);

// An m that is waiting for notewakeup(&m->havenextg). This may
// only be accessed while the scheduler lock is held. This is used to
// minimize the number of times we call notewakeup while the scheduler
// lock is held, since the m will normally move quickly to lock the
// scheduler itself, producing lock contention.

// Scheduling helpers. Sched must be locked.
static void gput(G*);	// put/get on ghead/gtail
static G* gget(void);
static void mput(M*);	// put/get on mhead
static void gfput(G*);	// put/get on gfree
static G* gfget(void);
static void matchmg(void);	// match m's to g's
static void readylocked(G*);	// ready, but sched is locked
static void mnextg(M*, G*);
static void mcommoninit(M*);
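
// Illustrative sketch (not part of the runtime): the FIFO discipline the
// gput/gget helpers implement. Each G carries an intrusive schedlink
// pointer; gput appends at gtail, gget pops from ghead, so goroutines run
// in the order they became ready. The example_ name is hypothetical and
// the wired/idle special cases are ignored.
static void example_append_g(G *gp) __attribute__ ((unused));

static void
example_append_g(G *gp)
{
	gp->schedlink = nil;
	if(runtime_sched.ghead == nil)
		runtime_sched.ghead = gp;		// queue was empty
	else
		runtime_sched.gtail->schedlink = gp;	// link after current tail
	runtime_sched.gtail = gp;
}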
	v = runtime_sched.atomic;
	w &= ~(mcpuMask<<mcpumaxShift);
	w |= n<<mcpumaxShift;
	if(runtime_cas(&runtime_sched.atomic, v, w))

// First function run by a new goroutine. This replaces gogocall.

	if(g->traceback != nil)

	fn = (void (*)(void*))(g->entry);
// Switch context to a different goroutine. This is like longjmp.
static void runtime_gogo(G*) __attribute__ ((noinline));

runtime_gogo(G* newg)

#ifdef USING_SPLIT_STACK
	__splitstack_setcontext(&newg->stack_context[0]);

	newg->fromgogo = true;
	fixcontext(&newg->context);
	setcontext(&newg->context);
	runtime_throw("gogo setcontext returned");
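
// Illustrative sketch (not part of the runtime): the getcontext/setcontext
// "returns twice" pattern that runtime_gogo above and runtime_mcall below
// rely on. getcontext always reports success, so a flag stored in the G
// (fromgogo) is the only way to tell the original return apart from the
// return forced by a later setcontext. The example_ name is hypothetical.
static void example_save_point(G *gp) __attribute__ ((unused));

static void
example_save_point(G *gp)
{
	gp->fromgogo = false;
	getcontext(&gp->context);	// control returns here twice
	if(gp->fromgogo) {
		// Second return: runtime_gogo(gp) set fromgogo and jumped
		// back here via setcontext, so gp is running again.
		return;
	}
	// First return: the context is now saved; a later runtime_gogo(gp)
	// resumes execution just after the getcontext call above.
}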
// Save context and call fn passing g as a parameter. This is like
// setjmp. Because getcontext always returns 0, unlike setjmp, we use
// g->fromgogo as a code. It will be true if we got here via
// setcontext. g == nil the first time this is called in a new m.
static void runtime_mcall(void (*)(G*)) __attribute__ ((noinline));

runtime_mcall(void (*pfn)(G*))

#ifndef USING_SPLIT_STACK
	// Ensure that all registers are on the stack for the garbage
	// collector.
	__builtin_unwind_init();

		runtime_throw("runtime: mcall called on m->g0 stack");

#ifdef USING_SPLIT_STACK
	__splitstack_getcontext(&g->stack_context[0]);

	gp->fromgogo = false;
	getcontext(&gp->context);

	// When we return from getcontext, we may be running
	// in a new thread. That means that m and g may have
	// changed. They are global variables so we will
	// reload them, but the addresses of m and g may be
	// cached in our local stack frame, and those
	// addresses may be wrong. Call functions to reload
	// the values for this thread.

	if(gp->traceback != nil)

	if (gp == nil || !gp->fromgogo) {
#ifdef USING_SPLIT_STACK
		__splitstack_setcontext(&mp->g0->stack_context[0]);

		mp->g0->entry = (byte*)pfn;

		// It's OK to set g directly here because this case
		// cannot occur if we got here via a setcontext to
		// the getcontext call just above.

		fixcontext(&mp->g0->context);
		setcontext(&mp->g0->context);
		runtime_throw("runtime: mcall function returned");
// Keep track of the scavenger's goroutine for deadlock detection.

// The bootstrap sequence is:
//
//	make & queue new G
//	call runtime_mstart
//
// The new G calls runtime_main.
runtime_schedinit(void)

	runtime_mallocinit();

	// Allocate internal symbol table representation now,
	// so that we don't need to call malloc when we crash.
	// runtime_findfunc(0);

	runtime_gomaxprocs = 1;
	p = runtime_getenv("GOMAXPROCS");
	if(p != nil && (n = runtime_atoi(p)) != 0) {
		if(n > maxgomaxprocs)
			n = maxgomaxprocs;
		runtime_gomaxprocs = n;

	// wait for the main goroutine to start before taking
	// GOMAXPROCS into account.
	runtime_singleproc = runtime_gomaxprocs == 1;

	canaddmcpu();	// mcpu++ to account for bootstrap m
	m->helpgc = 1;	// flag to tell schedule() to mcpu--
	runtime_sched.grunning++;

	// Can not enable GC until all roots are registered.
	// mstats.enablegc = 1;

extern void main_init(void) __asm__ (GOSYM_PREFIX "__go_init_main");
extern void main_main(void) __asm__ (GOSYM_PREFIX "main.main");
// The main goroutine.

	// Lock the main goroutine onto this, the main OS thread,
	// during initialization. Most programs won't care, but a few
	// do require certain calls to be made by the main thread.
	// Those can arrange for main.main to run in the main thread
	// by calling runtime.LockOSThread during initialization
	// to preserve the lock.
	runtime_LockOSThread();
	// From now on, new goroutines may use non-main threads.
	setmcpumax(runtime_gomaxprocs);
	runtime_sched.init = true;
	scvg = __go_go(runtime_MHeap_Scavenger, nil);
	scvg->issystem = true;

	runtime_sched.init = false;
	if(!runtime_sched.lockmain)
		runtime_UnlockOSThread();

	// For gccgo we have to wait until after main is initialized
	// to enable GC, because initializing main registers the GC
	// roots.

	// The deadlock detection has false negatives.
	// Let scvg start up, to eliminate the false negative
	// for the trivial program func main() { select{} }.
// Lock the scheduler.
	runtime_lock(&runtime_sched);

// Unlock the scheduler.
	runtime_unlock(&runtime_sched);

	runtime_notewakeup(&mp->havenextg);

	g->status = Gmoribund;

runtime_goroutineheader(G *gp)

		status = gp->waitreason;

	runtime_printf("goroutine %D [%s]:\n", gp->goid, status);
runtime_goroutinetrailer(G *g)

	if(g != nil && g->gopc != 0 && g->goid != 1) {
		if(__go_file_line(g->gopc - 1, &fn, &file, &line)) {
			runtime_printf("created by %S\n", fn);
			runtime_printf("\t%S:%D\n", file, (int64) line);

	Location locbuf[100];

runtime_tracebackothers(G* volatile me)

	traceback = runtime_gotraceback();
	for(gp = runtime_allg; gp != nil; gp = gp->alllink) {
		if(gp == me || gp->status == Gdead)
			continue;
		if(gp->issystem && traceback < 2)
			continue;
		runtime_printf("\n");
		runtime_goroutineheader(gp);

		// Our only mechanism for doing a stack trace is
		// _Unwind_Backtrace. And that only works for the
		// current thread, not for other random goroutines.
		// So we need to switch context to the goroutine, get
		// the backtrace, and then switch back.
		//
		// This means that if g is running or in a syscall, we
		// can't reliably print a stack trace. FIXME.
		if(gp->status == Gsyscall || gp->status == Grunning) {
			runtime_printf("no stack trace available\n");
			runtime_goroutinetrailer(gp);

#ifdef USING_SPLIT_STACK
		__splitstack_getcontext(&me->stack_context[0]);

		getcontext(&me->context);

		if(gp->traceback != nil) {

		runtime_printtrace(tb.locbuf, tb.c, false);
		runtime_goroutinetrailer(gp);

// Do a stack trace of gp, and then restore the context to
// gp->traceback->gp.
	Traceback* traceback;

	traceback = gp->traceback;
	traceback->c = runtime_callers(1, traceback->locbuf,
		sizeof traceback->locbuf / sizeof traceback->locbuf[0]);
	runtime_gogo(traceback->gp);

// Mark this g as m's idle goroutine.
// This functionality might be used in environments where programs
// are limited to a single thread, to simulate a select-driven
// network server. It is not exposed via the standard runtime API.
runtime_idlegoroutine(void)

		runtime_throw("g is already an idle goroutine");
	mp->id = runtime_sched.mcount++;
	mp->fastrand = 0x49f6428aUL + mp->id + runtime_cputicks();

	if(mp->mcache == nil)
		mp->mcache = runtime_allocmcache();

	runtime_callers(1, mp->createstack, nelem(mp->createstack));

	// Add to runtime_allm so garbage collector doesn't free m
	// when it is just in a register or thread-local storage.
	mp->alllink = runtime_allm;
	// runtime_NumCgoCall() iterates over allm w/o schedlock,
	// so we need to publish it safely.
	runtime_atomicstorep(&runtime_allm, mp);
// Try to increment mcpu. Report whether succeeded.

	v = runtime_sched.atomic;
	if(atomic_mcpu(v) >= atomic_mcpumax(v))

	if(runtime_cas(&runtime_sched.atomic, v, v+(1<<mcpuShift)))
// Put on `g' queue. Sched must be locked.

	// If g is wired, hand it off directly.
	if((mp = gp->lockedm) != nil && canaddmcpu()) {

	// If g is the idle goroutine for an m, hand it off.
	if(gp->idlem != nil) {
		if(gp->idlem->idleg != nil) {
			runtime_printf("m%d idle out of sync: g%D g%D\n",
				gp->idlem->id,
				gp->idlem->idleg->goid, gp->goid);
			runtime_throw("runtime: double idle");
		}
		gp->idlem->idleg = gp;

	if(runtime_sched.ghead == nil)
		runtime_sched.ghead = gp;
	else
		runtime_sched.gtail->schedlink = gp;
	runtime_sched.gtail = gp;

	// if it transitions to nonzero, set atomic gwaiting bit.
	if(runtime_sched.gwait++ == 0)
		runtime_xadd(&runtime_sched.atomic, 1<<gwaitingShift);

// Report whether gget would return something.

	return runtime_sched.ghead != nil || m->idleg != nil;
// Get from `g' queue. Sched must be locked.

	gp = runtime_sched.ghead;
		runtime_sched.ghead = gp->schedlink;
		if(runtime_sched.ghead == nil)
			runtime_sched.gtail = nil;
		// if it transitions to zero, clear atomic gwaiting bit.
		if(--runtime_sched.gwait == 0)
			runtime_xadd(&runtime_sched.atomic, -1<<gwaitingShift);
	} else if(m->idleg != nil) {

// Put on `m' list. Sched must be locked.

	mp->schedlink = runtime_sched.mhead;
	runtime_sched.mhead = mp;
	runtime_sched.mwait++;
// Get an `m' to run `g'. Sched must be locked.

	// if g has its own m, use it.
	if(gp && (mp = gp->lockedm) != nil)

	// otherwise use general m pool.
	if((mp = runtime_sched.mhead) != nil) {
		runtime_sched.mhead = mp->schedlink;
		runtime_sched.mwait--;
// Mark g ready to run.

// Mark g ready to run. Sched is already locked.
// G might be running already and about to stop.
// The sched lock protects g->status from changing underfoot.

		// Running on another machine.
		// Ready it when it stops.

	if(gp->status == Grunnable || gp->status == Grunning) {
		runtime_printf("goroutine %D has status %d\n", gp->goid, gp->status);
		runtime_throw("bad g->status in ready");
	}
	gp->status = Grunnable;

// Same as readylocked but a different symbol so that
// debuggers can set a breakpoint here and catch all
// new goroutines.
newprocreadylocked(G *gp)

// Pass g to m for running.
// Caller has already incremented mcpu.

	runtime_sched.grunning++;

	runtime_notewakeup(&mwakeup->havenextg);
// Get the next goroutine that m should run.
// Sched must be locked on entry, is unlocked on exit.
// Makes sure that at most $GOMAXPROCS g's are
// running on cpus (not in system calls) at any given time.

	if(atomic_mcpu(runtime_sched.atomic) >= maxgomaxprocs)
		runtime_throw("negative mcpu");

	// If there is a g waiting as m->nextg, the mcpu++
	// happened before it was passed to mnextg.
	if(m->nextg != nil) {

	if(m->lockedg != nil) {
		// We can only run one g, and it's not available.
		// Make sure some other cpu is running to handle
		// the ordinary run queue.
		if(runtime_sched.gwait != 0) {

		// m->lockedg might have been on the queue.
		if(m->nextg != nil) {

	// Look for work on global queue.
	while(haveg() && canaddmcpu()) {
			runtime_throw("gget inconsistency");

			mnextg(gp->lockedm, gp);

		runtime_sched.grunning++;

	// The while loop ended either because the g queue is empty
	// or because we have maxed out our m procs running go
	// code (mcpu >= mcpumax). We need to check that
	// concurrent actions by entersyscall/exitsyscall cannot
	// invalidate the decision to end the loop.
	//
	// We hold the sched lock, so no one else is manipulating the
	// g queue or changing mcpumax. Entersyscall can decrement
	// mcpu, but if it does so when there is something on the g queue,
	// the gwait bit will be set, so entersyscall will take the slow path
	// and use the sched lock. So it cannot invalidate our decision.
	// Wait on global m queue.

	// Look for deadlock situation.
	// There is a race with the scavenger that causes false negatives:
	// if the scavenger is just starting, then we have
	//	scvg != nil && grunning == 0 && gwait == 0
	// and we do not detect a deadlock. It is possible that we should
	// add that case to the if statement here, but it is too close to Go 1
	// to make such a subtle change. Instead, we work around the
	// false negative in trivial programs by calling runtime.gosched
	// from the main goroutine just before main.main.
	// See runtime_main above.
	//
	// On a related note, it is also possible that the scvg == nil case is
	// wrong and should include gwait, but that does not happen in
	// standard Go programs, which all start the scavenger.
	if((scvg == nil && runtime_sched.grunning == 0) ||
	   (scvg != nil && runtime_sched.grunning == 1 && runtime_sched.gwait == 0 &&
	    (scvg->status == Grunning || scvg->status == Gsyscall))) {
		m->throwing = -1;	// do not dump full stacks
		runtime_throw("all goroutines are asleep - deadlock!");
	}

	runtime_noteclear(&m->havenextg);

	// Stoptheworld is waiting for all but its cpu to go to stop.
	// Entersyscall might have decremented mcpu too, but if so
	// it will see the waitstop and take the slow path.
	// Exitsyscall never increments mcpu beyond mcpumax.
	v = runtime_atomicload(&runtime_sched.atomic);
	if(atomic_waitstop(v) && atomic_mcpu(v) <= atomic_mcpumax(v)) {
		// set waitstop = 0 (known to be 1)
		runtime_xadd(&runtime_sched.atomic, -1<<waitstopShift);
		runtime_notewakeup(&runtime_sched.stopped);
	}

	runtime_notesleep(&m->havenextg);

	runtime_lock(&runtime_sched);

	if((gp = m->nextg) == nil)
		runtime_throw("bad m->nextg in nextgoroutine");
runtime_gcprocs(void)

	// Figure out how many CPUs to use during GC.
	// Limited by gomaxprocs, number of actual CPUs, and MaxGcproc.
	n = runtime_gomaxprocs;
	if(n > runtime_ncpu)
		n = runtime_ncpu > 0 ? runtime_ncpu : 1;
	if(n > runtime_sched.mwait+1)	// one M is currently running
		n = runtime_sched.mwait+1;

runtime_helpgc(int32 nproc)

	runtime_lock(&runtime_sched);
	for(n = 1; n < nproc; n++) {	// one M is currently running
			runtime_throw("runtime_gcprocs inconsistency");

		runtime_notewakeup(&mp->havenextg);
	runtime_unlock(&runtime_sched);
runtime_stoptheworld(void)

	runtime_gcwaiting = 1;

		v = runtime_sched.atomic;
		if(atomic_mcpu(v) <= 1)

		// It would be unsafe for multiple threads to be using
		// the stopped note at once, but there is only
		// ever one thread doing garbage collection.
		runtime_noteclear(&runtime_sched.stopped);
		if(atomic_waitstop(v))
			runtime_throw("invalid waitstop");

		// atomic { waitstop = 1 }, predicated on mcpu <= 1 check above
		// still being true.
		if(!runtime_cas(&runtime_sched.atomic, v, v+(1<<waitstopShift)))

		runtime_notesleep(&runtime_sched.stopped);

	runtime_singleproc = runtime_gomaxprocs == 1;
runtime_starttheworld(void)

	// Figure out how many CPUs GC could possibly use.
	max = runtime_gomaxprocs;
	if(max > runtime_ncpu)
		max = runtime_ncpu > 0 ? runtime_ncpu : 1;

	runtime_gcwaiting = 0;
	setmcpumax(runtime_gomaxprocs);

	if(runtime_gcprocs() < max && canaddmcpu()) {
		// If GC could have used another helper proc, start one now,
		// in the hope that it will be available next time.
		// It would have been even better to start it before the collection,
		// but doing so requires allocating memory, so it's tricky to
		// coordinate. This lazy approach works out in practice:
		// we don't mind if the first couple gc rounds don't have quite
		// the maximum number of procs.
		//
		// canaddmcpu above did mcpu++
		// (necessary, because m will be doing various
		// initialization work so is definitely running),
		// but m is not running a specific goroutine,
		// so set the helpgc flag as a signal to m's
		// first schedule(nil) to mcpu-- and grunning--.
		mp = runtime_newm();

		runtime_sched.grunning++;
// Called to start an M.
runtime_mstart(void* mp)

	// Record top of stack for use by mcall.
	// Once we call schedule we're never coming back,
	// so other calls can reuse this stack space.
#ifdef USING_SPLIT_STACK
	__splitstack_getcontext(&g->stack_context[0]);

	g->gcinitial_sp = &mp;
	// Setting gcstack_size to 0 is a marker meaning that gcinitial_sp
	// is the top of the stack, not the bottom.
	g->gcstack_size = 0;

	getcontext(&g->context);

	if(g->entry != nil) {
		// Got here from mcall.
		void (*pfn)(G*) = (void (*)(G*))g->entry;
		G* gp = (G*)g->param;

#ifdef USING_SPLIT_STACK
	int dont_block_signals = 0;
	__splitstack_block_signals(&dont_block_signals, nil);

	// Install signal handlers; after minit so that minit can
	// prepare the thread to be able to handle the signals.
	if(m == &runtime_m0)

	// TODO(brainman): This point is never reached, because scheduler
	// does not release os threads at the moment. But once this path
	// is enabled, we must remove our seh here.

typedef struct CgoThreadStart CgoThreadStart;
struct CgoThreadStart
// Kick off new m's as needed (up to mcpumax).

	if(m->mallocing || m->gcing)

	while(haveg() && canaddmcpu()) {
			runtime_throw("gget inconsistency");

		// Find the m that will run gp.
		if((mp = mget(gp)) == nil)
			mp = runtime_newm();
// Create a new m. It will start off with a call to runtime_mstart.

	pthread_attr_t attr;

	static const Type *mtype;	// The Go type M

		runtime_gc_m_ptr(&e);
		mtype = ((const PtrType*)e.__type_descriptor)->__element_type;

	mp = runtime_mal(sizeof *mp);

	mp->g0 = runtime_malg(-1, nil, nil);

	if(pthread_attr_init(&attr) != 0)
		runtime_throw("pthread_attr_init");
	if(pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED) != 0)
		runtime_throw("pthread_attr_setdetachstate");

	stacksize = PTHREAD_STACK_MIN;

	// With glibc before version 2.16 the static TLS size is taken
	// out of the stack size, and we get an error or a crash if
	// there is not enough stack space left. Add it back in if we
	// can, in case the program uses a lot of TLS space. FIXME:
	// This can be disabled in glibc 2.16 and later, if the bug is
	// indeed fixed then.
	stacksize += tlssize;

	if(pthread_attr_setstacksize(&attr, stacksize) != 0)
		runtime_throw("pthread_attr_setstacksize");

	// Block signals during pthread_create so that the new thread
	// starts with signals disabled. It will enable them in minit.
	sigprocmask(SIG_BLOCK, &clear, &old);
	ret = pthread_create(&tid, &attr, runtime_mstart, mp);
	sigprocmask(SIG_SETMASK, &old, nil);

		runtime_throw("pthread_create");
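
// Illustrative sketch (not part of the runtime): the thread-creation
// pattern runtime_newm uses above, reduced to the essentials. The thread
// is detached, gets an explicit stack size, and is created with all
// signals blocked so it cannot take a signal before it has installed its
// own handlers (minit unblocks them in the real runtime). The example_
// names are hypothetical; <pthread.h> and <signal.h> are assumed.
static void example_spawn(void* (*start_fn)(void*), void *arg, size_t stacksize) __attribute__ ((unused));

static void
example_spawn(void* (*start_fn)(void*), void *arg, size_t stacksize)
{
	pthread_attr_t attr;
	pthread_t tid;
	sigset_t clear, old;

	if(pthread_attr_init(&attr) != 0)
		runtime_throw("pthread_attr_init");
	if(pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_DETACHED) != 0)
		runtime_throw("pthread_attr_setdetachstate");
	if(pthread_attr_setstacksize(&attr, stacksize) != 0)
		runtime_throw("pthread_attr_setstacksize");

	// Block every signal across pthread_create, then restore our own mask.
	sigfillset(&clear);
	sigprocmask(SIG_BLOCK, &clear, &old);
	if(pthread_create(&tid, &attr, start_fn, arg) != 0)
		runtime_throw("pthread_create");
	sigprocmask(SIG_SETMASK, &old, nil);
}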
// One round of scheduler: find a goroutine and run it.
// The argument is the goroutine that was running before
// schedule was called, or nil if this is the first call.

		// Just finished running gp.
		runtime_sched.grunning--;

		// atomic { mcpu-- }
		v = runtime_xadd(&runtime_sched.atomic, -1<<mcpuShift);
		if(atomic_mcpu(v) > maxgomaxprocs)
			runtime_throw("negative mcpu in scheduler");

		switch(gp->status) {

			// Shouldn't have been running!
			runtime_throw("bad gp->status in sched");

			gp->status = Grunnable;

			runtime_racegoend(gp->goid);

			runtime_memclr(&gp->context, sizeof gp->context);

			if(--runtime_sched.gcount == 0)

		if(gp->readyonstop) {
			gp->readyonstop = 0;

	} else if(m->helpgc) {
		// Bootstrap m or new m started by starttheworld.
		// atomic { mcpu-- }
		v = runtime_xadd(&runtime_sched.atomic, -1<<mcpuShift);
		if(atomic_mcpu(v) > maxgomaxprocs)
			runtime_throw("negative mcpu in scheduler");
		// Compensate for increment in starttheworld().
		runtime_sched.grunning--;

	} else if(m->nextg != nil) {
		// New m started by matchmg.

		runtime_throw("invalid m state in scheduler");

	// Find (or wait for) g to run. Unlocks runtime_sched.
	gp = nextgandunlock();
	gp->readyonstop = 0;
	gp->status = Grunning;

	// Check whether the profiler needs to be turned on or off.
	hz = runtime_sched.profilehz;
	if(m->profilehz != hz)
		runtime_resetcpuprofiler(hz);
// Enter scheduler. If g->status is Grunning,
// re-queues g and runs everyone else who is waiting
// before running g again. If g->status is Gmoribund,
// kills off g.
runtime_gosched(void)

		runtime_throw("gosched holding locks");

		runtime_throw("gosched of g0");

	runtime_mcall(schedule);
// Puts the current goroutine into a waiting state and unlocks the lock.
// The goroutine can be made runnable again by calling runtime_ready(gp).
runtime_park(void (*unlockf)(Lock*), Lock *lock, const char *reason)

	g->status = Gwaiting;
	g->waitreason = reason;
// The goroutine g is about to enter a system call.
// Record that it's not using the cpu anymore.
// This is called only from the go syscall library and cgocall,
// not from the low-level system calls used by the runtime.
//
// Entersyscall cannot split the stack: the runtime_gosave must
// make g->sched refer to the caller's stack segment, because
// entersyscall is going to return immediately after.
// It's okay to call matchmg and notewakeup even after
// decrementing mcpu, because we haven't released the
// sched lock yet, so the garbage collector cannot be running.

void runtime_entersyscall(void) __attribute__ ((no_split_stack));

runtime_entersyscall(void)

	if(m->profilehz > 0)
		runtime_setprof(false);

	// Leave SP around for gc and traceback.
#ifdef USING_SPLIT_STACK
	g->gcstack = __splitstack_find(nil, nil, &g->gcstack_size,
				       &g->gcnext_segment, &g->gcnext_sp,
				       &g->gcinitial_sp);

	g->gcnext_sp = (byte *) &v;

	// Save the registers in the g structure so that any pointers
	// held in registers will be seen by the garbage collector.
	getcontext(&g->gcregs);

	g->status = Gsyscall;

	// The slow path inside the schedlock/schedunlock will get
	// through without stopping if it does:
	//	mcpu--
	//	gwait not true
	//	waitstop && mcpu <= mcpumax not true
	// If we can do the same with a single atomic add,
	// then we can skip the locks.
	v = runtime_xadd(&runtime_sched.atomic, -1<<mcpuShift);
	if(!atomic_gwaiting(v) && (!atomic_waitstop(v) || atomic_mcpu(v) > atomic_mcpumax(v)))

	v = runtime_atomicload(&runtime_sched.atomic);
	if(atomic_gwaiting(v)) {

	v = runtime_atomicload(&runtime_sched.atomic);
	if(atomic_waitstop(v) && atomic_mcpu(v) <= atomic_mcpumax(v)) {
		runtime_xadd(&runtime_sched.atomic, -1<<waitstopShift);
		runtime_notewakeup(&runtime_sched.stopped);
	}
// The goroutine g exited its system call.
// Arrange for it to run on a cpu again.
// This is called only from the go syscall library, not
// from the low-level system calls used by the runtime.
runtime_exitsyscall(void)

	// If we can do the mcpu++ bookkeeping and
	// find that we still have mcpu <= mcpumax, then we can
	// start executing Go code immediately, without having to
	// schedlock/schedunlock.
	// Also do fast return if any locks are held, so that
	// panic code can use syscalls to open a file.
	v = runtime_xadd(&runtime_sched.atomic, (1<<mcpuShift));
	if((m->profilehz == runtime_sched.profilehz && atomic_mcpu(v) <= atomic_mcpumax(v)) || m->locks > 0) {
		// There's a cpu for us, so we can run.
		gp->status = Grunning;
		// Garbage collector isn't running (since we are),
		// so okay to clear gcstack.
#ifdef USING_SPLIT_STACK
		gp->gcnext_sp = nil;
		runtime_memclr(&gp->gcregs, sizeof gp->gcregs);

		if(m->profilehz > 0)
			runtime_setprof(true);

	// Tell scheduler to put g back on the run queue:
	// mostly equivalent to g->status = Grunning,
	// but keeps the garbage collector from thinking
	// that g is running right now, which it's not.
	gp->readyonstop = 1;

	// All the cpus are taken.
	// The scheduler will ready g and put this m to sleep.
	// When the scheduler takes g away from m,
	// it will undo the runtime_sched.mcpu++ above.

	// Gosched returned, so we're allowed to run now.
	// Delete the gcstack information that we left for
	// the garbage collector during the system call.
	// Must wait until now because until gosched returns
	// we don't know for sure that the garbage collector
	// is not running.
#ifdef USING_SPLIT_STACK
	gp->gcnext_sp = nil;
	runtime_memclr(&gp->gcregs, sizeof gp->gcregs);
// Allocate a new g, with a stack big enough for stacksize bytes.
runtime_malg(int32 stacksize, byte** ret_stack, size_t* ret_stacksize)

	newg = runtime_malloc(sizeof(G));
	if(stacksize >= 0) {
#if USING_SPLIT_STACK
		int dont_block_signals = 0;

		*ret_stack = __splitstack_makecontext(stacksize,
						      &newg->stack_context[0],
						      ret_stacksize);
		__splitstack_block_signals_context(&newg->stack_context[0],
						   &dont_block_signals, nil);
#else
		*ret_stack = runtime_mallocgc(stacksize, FlagNoProfiling|FlagNoGC, 0, 0);
		*ret_stacksize = stacksize;
		newg->gcinitial_sp = *ret_stack;
		newg->gcstack_size = stacksize;
		runtime_xadd(&runtime_stacks_sys, stacksize);
/* For runtime package testing. */

void runtime_testing_entersyscall(void)
  __asm__ (GOSYM_PREFIX "runtime.entersyscall");

runtime_testing_entersyscall()

	runtime_entersyscall();

void runtime_testing_exitsyscall(void)
  __asm__ (GOSYM_PREFIX "runtime.exitsyscall");

runtime_testing_exitsyscall()

	runtime_exitsyscall();
__go_go(void (*fn)(void*), void* arg)

	goid = runtime_xadd64((uint64*)&runtime_sched.goidgen, 1);

	runtime_racegostart(goid, runtime_getcallerpc(&fn));

	if((newg = gfget()) != nil) {
#ifdef USING_SPLIT_STACK
		int dont_block_signals = 0;

		sp = __splitstack_resetcontext(&newg->stack_context[0],
					       &spsize);
		__splitstack_block_signals_context(&newg->stack_context[0],
						   &dont_block_signals, nil);
#else
		sp = newg->gcinitial_sp;
		spsize = newg->gcstack_size;

			runtime_throw("bad spsize in __go_go");
		newg->gcnext_sp = sp;

		newg = runtime_malg(StackMin, &sp, &spsize);
		if(runtime_lastg == nil)
			runtime_allg = newg;
		else
			runtime_lastg->alllink = newg;
		runtime_lastg = newg;

	newg->status = Gwaiting;
	newg->waitreason = "new goroutine";

	newg->entry = (byte*)fn;

	newg->gopc = (uintptr)__builtin_return_address(0);

	runtime_sched.gcount++;

		runtime_throw("nil g->stack0");
	// Avoid warnings about variables clobbered by
	// longjmp.
	byte * volatile vsp = sp;
	size_t volatile vspsize = spsize;
	G * volatile vnewg = newg;

	getcontext(&vnewg->context);
	vnewg->context.uc_stack.ss_sp = vsp;
#ifdef MAKECONTEXT_STACK_TOP
	vnewg->context.uc_stack.ss_sp += vspsize;
#endif
	vnewg->context.uc_stack.ss_size = vspsize;
	makecontext(&vnewg->context, kickoff, 0);

	newprocreadylocked(vnewg);
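
// Illustrative sketch (not part of the runtime): the ucontext mechanics
// __go_go uses above, in isolation. getcontext fills in a context,
// uc_stack points it at its own stack, and makecontext arranges for an
// entry function to run when the context is switched to. The example_
// names are hypothetical; a real goroutine instead starts in kickoff and
// is handed to the scheduler rather than swapcontext.
static ucontext_t example_main_ctx, example_task_ctx;
static byte example_stack[16384];

static void
example_task(void)
{
	// Runs on example_stack; swap back to whoever started us.
	swapcontext(&example_task_ctx, &example_main_ctx);
}

static void example_start(void) __attribute__ ((unused));

static void
example_start(void)
{
	getcontext(&example_task_ctx);
	example_task_ctx.uc_stack.ss_sp = example_stack;
	example_task_ctx.uc_stack.ss_size = sizeof example_stack;
	example_task_ctx.uc_link = &example_main_ctx;
	makecontext(&example_task_ctx, example_task, 0);
	swapcontext(&example_main_ctx, &example_task_ctx);	// run example_task
}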
// Put on gfree list. Sched must be locked.

	gp->schedlink = runtime_sched.gfree;
	runtime_sched.gfree = gp;

// Get from gfree list. Sched must be locked.

	gp = runtime_sched.gfree;
		runtime_sched.gfree = gp->schedlink;

void runtime_Gosched (void) __asm__ (GOSYM_PREFIX "runtime.Gosched");

runtime_Gosched(void)
// Implementation of runtime.GOMAXPROCS.
// delete when scheduler is stronger
runtime_gomaxprocsfunc(int32 n)

	ret = runtime_gomaxprocs;
	if(n > maxgomaxprocs)
		n = maxgomaxprocs;
	runtime_gomaxprocs = n;
	if(runtime_gomaxprocs > 1)
		runtime_singleproc = false;
	if(runtime_gcwaiting != 0) {
		if(atomic_mcpumax(runtime_sched.atomic) != 1)
			runtime_throw("invalid mcpumax during gc");

	// If there are now fewer allowed procs
	// than procs running, stop.
	v = runtime_atomicload(&runtime_sched.atomic);
	if((int32)atomic_mcpu(v) > n) {

	// handle more procs
runtime_LockOSThread(void)

	if(m == &runtime_m0 && runtime_sched.init) {
		runtime_sched.lockmain = true;

runtime_UnlockOSThread(void)

	if(m == &runtime_m0 && runtime_sched.init) {
		runtime_sched.lockmain = false;

runtime_lockedOSThread(void)

	return g->lockedm != nil && m->lockedg != nil;

// for testing of callbacks

_Bool runtime_golockedOSThread(void)
  __asm__ (GOSYM_PREFIX "runtime.golockedOSThread");

runtime_golockedOSThread(void)

	return runtime_lockedOSThread();

// for testing of wire, unwire
intgo runtime_NumGoroutine (void)
  __asm__ (GOSYM_PREFIX "runtime.NumGoroutine");

runtime_NumGoroutine()

	return runtime_sched.gcount;

runtime_gcount(void)

	return runtime_sched.gcount;

runtime_mcount(void)

	return runtime_sched.mcount;

	void (*fn)(uintptr*, int32);

	Location locbuf[100];
// Called if we receive a SIGPROF signal.

	if(prof.fn == nil || prof.hz == 0)

	runtime_lock(&prof);
	if(prof.fn == nil) {
		runtime_unlock(&prof);

	n = runtime_callers(0, prof.locbuf, nelem(prof.locbuf));
	for(i = 0; i < n; i++)
		prof.pcbuf[i] = prof.locbuf[i].pc;
	prof.fn(prof.pcbuf, n);
	runtime_unlock(&prof);
// Arrange to call fn with a traceback hz times a second.
runtime_setcpuprofilerate(void (*fn)(uintptr*, int32), int32 hz)

	// Force sane arguments.

	// Stop profiler on this cpu so that it is safe to lock prof.
	// if a profiling signal came in while we had prof locked,
	// it would deadlock.
	runtime_resetcpuprofiler(0);

	runtime_lock(&prof);
	runtime_unlock(&prof);

	runtime_lock(&runtime_sched);
	runtime_sched.profilehz = hz;
	runtime_unlock(&runtime_sched);

		runtime_resetcpuprofiler(hz);
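
// Illustrative sketch (not part of this file): one common way a profiling
// clock like the one runtime_resetcpuprofiler manages is armed, using
// setitimer with ITIMER_PROF so the kernel delivers SIGPROF roughly hz
// times per second of cpu time consumed. Whether the real implementation
// uses exactly this call is platform dependent; the example_ name is
// hypothetical and <sys/time.h> is assumed.
static void example_arm_profile_clock(int32 hz) __attribute__ ((unused));

static void
example_arm_profile_clock(int32 hz)
{
	struct itimerval it;

	runtime_memclr((byte*)&it, sizeof it);
	if(hz > 0) {
		it.it_interval.tv_sec = 0;
		it.it_interval.tv_usec = 1000000 / hz;
		it.it_value = it.it_interval;	// first tick after one interval
	}
	setitimer(ITIMER_PROF, &it, nil);	// hz == 0 leaves it disarmed
}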