VMS/VMS_Implementations/VMS_impls/VMS__MC_shared

comparison MasterLoop.c @ 31:e69579a0e797

Works multi-core.. pinned VP to a core loop

author	Me
date	Wed, 01 Sep 2010 08:23:39 -0700
parents	c8823e0bb2b4
children	17d20e5cf924

comparison

equal deleted inserted replaced

-:acd91b87dcdc
+:73e221819099
 * directly at end of master loop
 *So VMS__init just births the master virtual processor same way it births
 * all the others -- then does any extra setup needed and puts it into the
 * work queue.
 *However, this means masterEnv has to be a global static volatile, the same way
-* did with workQ in core loop.  -- for performance, put the
+* did with readyToAnimateQ in core loop.  -- for performance, put the
 * jump to the core loop directly in here, and have it directly jump back.
+*
+*
+*Aug 18, 2010 -- Going to a separate MasterVP for each core, to see if this
+* avoids the suspected bug in the system stack that causes bizarre faults
+* at random places in the system code.
+*
+*So, this function is coupled to each of the MasterVPs, -- meaning this
+* function can't rely on a particular stack and frame -- each MasterVP that
+* animates this function has a different one.
+*
+*At this point, the masterLoop does not write itself into the queue anymore,
+* instead, the coreLoop acquires the masterLock when it has nothing to
+* animate, and then animates its own masterLoop.  However, still try to put
+* several AppVPs into the queue to amortize the startup cost of switching
+* to the MasterVP.  Note, don't have to worry about latency of requests much
+* because most requests generate work for same core -- only latency issue
+* is case when other cores starved and one core's requests generate work
+* for them -- so keep the max number in the queue to 3 or 4.
 */
-void masterLoop( void *initData, VirtProcr *masterPr )
+void masterLoop( void *initData, VirtProcr *animatingPr )
 {
-int             slotIdx, numFilled, filledSlotIdx, masterHasBeenQueued;
+int             slotIdx;
 VirtProcr      *schedVirtPr;
-SchedSlot      *currSlot, **schedSlots, **filledSlots;
+SchedSlot      *currSlot, **schedSlots;
 MasterEnv      *masterEnv;
-VMSQueueStruc  *workQ;
+VMSQueueStruc  *readyToAnimateQ;
-void           *jmpPt, *stackPtrAddr, *framePtrAddr, *stillRunningAddr;
-void           *coreLoopFramePtr, *coreLoopStackPtr, *semanticEnv;
 SlaveScheduler  slaveScheduler;
 RequestHandler  requestHandler;
+void           *semanticEnv;
-//this will run as the first virt processor in workQ, and will be a
+int             thisCoresIdx;
-// new born -- so will do all the GCC-generated allocating space on
+VirtProcr      *masterPr;
-// the stack owned by master virt procr -- and will run this last bit
+volatile        VirtProcr *volatileMasterPr;
-// of setup code..
+volatileMasterPr = animatingPr;
+masterPr         = volatileMasterPr; //used to force re-define after jmp
+//First animation of each MasterVP will in turn animate this part
+// of setup code.. (VP creator sets up the stack as if this function
+// was called normally, but actually get here by jmp)
+//So, setup values about stack ptr, jmp pt and all that
 masterPr->nextInstrPt = &&masterLoopStartPt;
-//The second time MasterVP comes out of queue, the first animation of
-// it hasn't written the stackPtr and framePtr yet -- but the second
-// animation has already had its stackPtr and framePtr set to the old
-// value by the coreLoop.  Fix this by writing the correct stack and
-// frame pointers here, at which point they're correct in the first
-// animation of MasterVP.
-//TODO: remove writing stackPtr and framePtr at the bottom, for eff
-stackPtrAddr      = &(masterPr->stackPtr);
-framePtrAddr      = &(masterPr->framePtr);
-asm volatile("movl %0,     %%eax;  \
+//Note, got rid of writing the stack and frame ptr up here, because
-movl %%esp, (%%eax); \
+// only one
-movl %1,     %%eax;  \
+// core can ever animate a given MasterVP, so don't need to communicate
-movl %%ebp, (%%eax); "
+// new frame and stack ptr to the MasterVP storage before a second
-/* outputs */ : "=g" (stackPtrAddr), "=g" (framePtrAddr)                 \
+// version of that MasterVP can get animated on a different core.
-/* inputs  */ :                                                          \
+//Also got rid of the busy-wait.
-/* clobber */ : "memory", "%eax", "%ebx"                                 \
-);
+masterLoopStartPt:
+masterEnv        = _VMSMasterEnv;
+//TODO: check that this compiles so that masterPr is always re-loaded from frame storage
+masterPr         = volatileMasterPr;  //just to make sure after jmp
+thisCoresIdx     = masterPr->coreAnimatedBy;
+readyToAnimateQ  = masterEnv->readyToAnimateQs[thisCoresIdx];
+schedSlots       = masterEnv->allSchedSlots[thisCoresIdx];
+requestHandler   = masterEnv->requestHandler;
+slaveScheduler   = masterEnv->slaveScheduler;
+semanticEnv      = masterEnv->semanticEnv;
-masterLoopStartPt:
+//Poll each slot's Done flag
-//if another reference to same Master VirtProcr still going, busy-wait
-//Could put this lower, but don't want to think about shared stack..
-while( _VMSMasterEnv->stillRunning ) /*busy wait*/ ;
-//TODO: want to do busy-wait as assembly, to be sure stack not touched?
-//this is the only master running now, set flag again
-_VMSMasterEnv->stillRunning = TRUE;
-masterEnv = _VMSMasterEnv;
-//TODO: gdb -- check that a volatile _VMSMasterEnv and _VMSWorkQ means
-// all these will be re-filled every time jump here..
-workQ            = _VMSWorkQ;
-requestHandler   = masterEnv->requestHandler;
-slaveScheduler   = masterEnv->slaveScheduler;
-schedSlots       = masterEnv->schedSlots;
-filledSlots      = masterEnv->filledSlots;
-masterPr         = masterEnv->masterVirtPr;  //post-jmp clobbered, re-load
-semanticEnv      = masterEnv->semanticEnv;
-//prepare for scheduling
-numFilled = 0;
-masterHasBeenQueued = FALSE;
-//Poll each slot's Done flag -- slot 0 reserved for master, start at 1
 for( slotIdx = 0; slotIdx < NUM_SCHED_SLOTS; slotIdx++)
 {
 currSlot = schedSlots[ slotIdx ];
 if( currSlot->workIsDone )
 (*requestHandler)( currSlot->procrAssignedToSlot, semanticEnv );
 }
 if( currSlot->needsProcrAssigned )
 {    //give slot a new virt procr
 schedVirtPr =
-(*slaveScheduler)( semanticEnv );
+(*slaveScheduler)( semanticEnv, thisCoresIdx );
 if( schedVirtPr != NULL )
 { currSlot->procrAssignedToSlot = schedVirtPr;
 schedVirtPr->schedSlot        = currSlot;
 currSlot->needsProcrAssigned  = FALSE;
-filledSlots[ numFilled ]      = currSlot;
+writeSRSWQ( schedVirtPr, readyToAnimateQ );
-writeVMSQ( schedVirtPr, workQ );
-numFilled += 1;
-if( numFilled == masterEnv->numToPrecede )
-{
-writeVMSQ( masterEnv->masterVirtPr, workQ );
-masterHasBeenQueued = TRUE;
-}
 }
 }
 }
-if( !masterHasBeenQueued )
-{
-writeVMSQ( masterEnv->masterVirtPr, workQ );
-}
-//Adjust the number to precede, for next round -- assume rate of
+//Save stack ptr and frame, restore CoreLoop's stack and frame,
-// finishing work is stable -- which is a bad assumption!  But, just
+// and clear the MasterLock
-// want something working for the moment, look at dynamic behavior
-// later
-//TODO: look at dynamic behavior -- time-average numToPrecede or something
-if( numFilled < NUM_CORES - 1 )
-{
-masterEnv->numToPrecede = 1;
-}
-else
-{ masterEnv->numToPrecede = numFilled - NUM_CORES + 1;
-}
-//Save stack ptr and frame -- don't need to, take out later, but safe
-// Also, wait to set stillRunning to FALSE until just before jump, to
-// be safe -- although the two simulatneously animated MasterLoops
-// are on different cores, so have different stacks, so no worries
-// there.
-//Restore CoreLoop's stack frame (and stack pointer, to be safe)
 //TODO: carefully verify that we don't need to force saving anything to the stack
 // before jumping back to core loop.
+void           *stackPtrAddr, *framePtrAddr, *masterLockAddr;
+void           *jmpPt, *coreLoopFramePtr, *coreLoopStackPtr;
 stackPtrAddr      = &(masterPr->stackPtr);
 framePtrAddr      = &(masterPr->framePtr);
-stillRunningAddr  = &(_VMSMasterEnv->stillRunning); //when race condition
+masterLockAddr    = &(_VMSMasterEnv->masterLock);
-//arises, stillRunning is shared between the two cores both animating
-// MasterLoop -- but those two cores have different esp & ebp, so safe
-// to change stack and frame pointer here, without one messing up other
-// one
-jmpPt             = masterPr->coreLoopStartPt;
+jmpPt             = _VMSMasterEnv->coreLoopStartPt;
 coreLoopFramePtr  = masterPr->coreLoopFramePtr;//need this only
 coreLoopStackPtr  = masterPr->coreLoopStackPtr;//shouldn't need -- safety
 asm volatile("movl %0,     %%eax;  \
 movl %%esp, (%%eax); \
 movl %4, %%esp;      \
 movl %5, %%ebp;      \
 movl $0x0, (%%ebx);  \
 jmp  %%eax;"         \
 /* outputs */ : "=g" (stackPtrAddr), "=g" (framePtrAddr),                \
-"=g"(stillRunningAddr)                                   \
+"=g"(masterLockAddr)                                   \
 /* inputs  */ : "g" (jmpPt), "g"(coreLoopStackPtr), "g"(coreLoopFramePtr)\
 /* clobber */ : "memory", "%eax", "%ebx", "%ecx", "%edx", "%edi", "%esi" \
 );//can probably make clobber list empty -- but safe for now
 }

Mercurial > cgi-bin > hgwebdir.cgi > VMS > VMS_Implementations > VMS_impls > VMS__MC_shared_impl

comparison MasterLoop.c @ 31:e69579a0e797