1797 lines
32 KiB
C
1797 lines
32 KiB
C
/*
|
|
* This file is part of Jehanne.
|
|
*
|
|
* Copyright (C) 2015-2016 Giacomo Tesio <giacomo@tesio.it>
|
|
*
|
|
* Jehanne is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation, version 2 of the License.
|
|
*
|
|
* Jehanne is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with Jehanne. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
#include <u.h>
|
|
#include "../port/lib.h"
|
|
#include "mem.h"
|
|
#include "dat.h"
|
|
#include "fns.h"
|
|
#include "../port/error.h"
|
|
|
|
#include "errstr.h"
|
|
#include <ptrace.h>
|
|
|
|
int nrdy;
|
|
Ref noteidalloc;
|
|
|
|
uint32_t delayedscheds; /* statistics */
|
|
long skipscheds;
|
|
long preempts;
|
|
|
|
static Ref pidalloc;
|
|
static int machnoalloc;
|
|
|
|
struct Procalloc procalloc;
|
|
|
|
extern Proc* psalloc(void);
|
|
extern void pshash(Proc*);
|
|
extern void psrelease(Proc*);
|
|
extern void psunhash(Proc*);
|
|
|
|
enum
|
|
{
|
|
Scaling=2,
|
|
};
|
|
|
|
static int reprioritize(Proc*);
|
|
static void updatecpu(Proc*);
|
|
static int64_t schedgain = 30; /* units in seconds */
|
|
|
|
static void rebalance(void);
|
|
static uint32_t balancetime;
|
|
|
|
Schedq runq[Npriq];
|
|
uint32_t runvec;
|
|
|
|
char *statename[] =
|
|
{ /* BUG: generate automatically */
|
|
"Dead",
|
|
"Moribund",
|
|
"Broken",
|
|
"Ready",
|
|
"Scheding",
|
|
"Running",
|
|
"Queueing",
|
|
"QueueingR",
|
|
"QueueingW",
|
|
"Wakeme",
|
|
"Stopped",
|
|
"Rendez",
|
|
"Waitrelease",
|
|
};
|
|
|
|
/*
|
|
* Always splhi()'ed.
|
|
*/
|
|
void
|
|
schedinit(void) /* never returns */
|
|
{
|
|
setlabel(&m->sched);
|
|
if(up) {
|
|
updatecpu(up);
|
|
m->proc = 0;
|
|
switch(up->state) {
|
|
case Running:
|
|
ready(up);
|
|
break;
|
|
case Moribund:
|
|
up->state = Dead;
|
|
|
|
/*
|
|
* Holding lock from pexit:
|
|
* procalloc
|
|
*/
|
|
mmurelease(up);
|
|
|
|
psrelease(up);
|
|
unlock(&procalloc.l);
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
up->mach = nil;
|
|
coherence();
|
|
up = nil;
|
|
}
|
|
sched();
|
|
}
|
|
|
|
/*
|
|
* If changing this routine, look also at sleep(). It
|
|
* contains a copy of the guts of sched().
|
|
*/
|
|
void
|
|
sched(void)
|
|
{
|
|
Proc *p;
|
|
|
|
if(m->ilockdepth)
|
|
panic("cpu%d: ilockdepth %d, last lock %#p at %#p, sched called from %#p",
|
|
m->machno,
|
|
m->ilockdepth,
|
|
up? up->lastilock: nil,
|
|
(up && up->lastilock)? lockgetpc(up->lastilock): m->ilockpc,
|
|
getcallerpc());
|
|
|
|
if(up){
|
|
/*
|
|
* Delay the sched until the process gives up the locks
|
|
* it is holding. This avoids dumb lock loops.
|
|
* Don't delay if the process is Moribund: it called sched to die.
|
|
*/
|
|
if(up->nlocks && up->state != Moribund)
|
|
if(up->delaysched < 20 || proc_own_pagepool(up)){
|
|
up->delaysched++;
|
|
delayedscheds++;
|
|
return;
|
|
}
|
|
up->delaysched = 0;
|
|
|
|
splhi();
|
|
|
|
/* statistics */
|
|
m->cs++;
|
|
|
|
procsave(up);
|
|
if(setlabel(&up->sched)){
|
|
procrestore(up);
|
|
spllo();
|
|
return;
|
|
}
|
|
gotolabel(&m->sched);
|
|
}
|
|
p = runproc();
|
|
updatecpu(p);
|
|
p->priority = reprioritize(p);
|
|
if(p != m->readied)
|
|
m->schedticks = m->ticks + HZ/10;
|
|
m->readied = 0;
|
|
up = p;
|
|
lock(&up->rlock);
|
|
up->state = Running;
|
|
up->mach = m;
|
|
m->proc = up;
|
|
unlock(&up->rlock);
|
|
mmuswitch(up);
|
|
gotolabel(&up->sched);
|
|
}
|
|
|
|
int
|
|
anyready(void)
|
|
{
|
|
return runvec;
|
|
}
|
|
|
|
int
|
|
anyhigher(void)
|
|
{
|
|
return runvec & ~((1<<(up->priority+1))-1);
|
|
}
|
|
|
|
/*
|
|
* here once per clock tick to see if we should resched
|
|
*/
|
|
void
|
|
hzsched(void)
|
|
{
|
|
/* once a second, rebalance will reprioritize ready procs */
|
|
if(m->machno == 0)
|
|
rebalance();
|
|
|
|
/* unless preempted, get to run for at least 100ms */
|
|
if(anyhigher()
|
|
|| (!up->fixedpri && m->ticks > m->schedticks && anyready())){
|
|
m->readied = nil; /* avoid cooperative scheduling */
|
|
up->delaysched++;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* here at the end of non-clock interrupts to see if we should preempt the
|
|
* current process. Returns 1 if preempted, 0 otherwise.
|
|
*/
|
|
int
|
|
preempted(void)
|
|
{
|
|
if(up && up->state == Running &&
|
|
!up->preempted &&
|
|
anyhigher() &&
|
|
!active.exiting){
|
|
m->readied = nil; /* avoid cooperative scheduling */
|
|
up->preempted = 1;
|
|
sched();
|
|
splhi();
|
|
up->preempted = 0;
|
|
return 1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/*
|
|
* Update the cpu time average for this particular process,
|
|
* which is about to change from up -> not up or vice versa.
|
|
* p->lastupdate is the last time an updatecpu happened.
|
|
*
|
|
* The cpu time average is a decaying average that lasts
|
|
* about D clock ticks. D is chosen to be approximately
|
|
* the cpu time of a cpu-intensive "quick job". A job has to run
|
|
* for approximately D clock ticks before we home in on its
|
|
* actual cpu usage. Thus if you manage to get in and get out
|
|
* quickly, you won't be penalized during your burst. Once you
|
|
* start using your share of the cpu for more than about D
|
|
* clock ticks though, your p->cpu hits 1000 (1.0) and you end up
|
|
* below all the other quick jobs. Interactive tasks, because
|
|
* they basically always use less than their fair share of cpu,
|
|
* will be rewarded.
|
|
*
|
|
* If the process has not been running, then we want to
|
|
* apply the filter
|
|
*
|
|
* cpu = cpu * (D-1)/D
|
|
*
|
|
* n times, yielding
|
|
*
|
|
* cpu = cpu * ((D-1)/D)^n
|
|
*
|
|
* but D is big enough that this is approximately
|
|
*
|
|
* cpu = cpu * (D-n)/D
|
|
*
|
|
* so we use that instead.
|
|
*
|
|
* If the process has been running, we apply the filter to
|
|
* 1 - cpu, yielding a similar equation. Note that cpu is
|
|
* stored in fixed point (* 1000).
|
|
*
|
|
* Updatecpu must be called before changing up, in order
|
|
* to maintain accurate cpu usage statistics. It can be called
|
|
* at any time to bring the stats for a given proc up-to-date.
|
|
*/
|
|
static void
|
|
updatecpu(Proc *p)
|
|
{
|
|
int64_t D, n, t, ocpu;
|
|
|
|
t = sys->ticks*Scaling + Scaling/2;
|
|
n = t - p->lastupdate;
|
|
p->lastupdate = t;
|
|
|
|
if(n == 0)
|
|
return;
|
|
D = schedgain*HZ*Scaling;
|
|
if(n > D)
|
|
n = D;
|
|
|
|
ocpu = p->cpu;
|
|
if(p != up)
|
|
p->cpu = (ocpu*(D-n))/D;
|
|
else{
|
|
t = 1000 - ocpu;
|
|
t = (t*(D-n))/D;
|
|
p->cpu = 1000 - t;
|
|
}
|
|
|
|
//iprint("pid %d %s for %d cpu %d -> %d\n", p->pid,p==up?"active":"inactive",n, ocpu,p->cpu);
|
|
}
|
|
|
|
/*
|
|
* On average, p has used p->cpu of a cpu recently.
|
|
* Its fair share is sys->nmach/m->load of a cpu. If it has been getting
|
|
* too much, penalize it. If it has been getting not enough, reward it.
|
|
* I don't think you can get much more than your fair share that
|
|
* often, so most of the queues are for using less. Having a priority
|
|
* of 3 means you're just right. Having a higher priority (up to p->basepri)
|
|
* means you're not using as much as you could.
|
|
*/
|
|
static int
|
|
reprioritize(Proc *p)
|
|
{
|
|
int fairshare, n, load, ratio;
|
|
|
|
load = sys->machptr[0]->load;
|
|
if(load == 0)
|
|
return p->basepri;
|
|
|
|
/*
|
|
* fairshare = 1.000 * ncpu * 1.000/load,
|
|
* except the decimal point is moved three places
|
|
* on both load and fairshare.
|
|
*/
|
|
fairshare = (sys->nmach*1000*1000)/load;
|
|
n = p->cpu;
|
|
if(n == 0)
|
|
n = 1;
|
|
ratio = (fairshare+n/2) / n;
|
|
if(ratio > p->basepri)
|
|
ratio = p->basepri;
|
|
if(ratio < 0)
|
|
panic("reprioritize");
|
|
//iprint("pid %d cpu %d load %d fair %d pri %d\n", p->pid, p->cpu, load, fairshare, ratio);
|
|
return ratio;
|
|
}
|
|
|
|
/*
|
|
* add a process to a scheduling queue
|
|
*/
|
|
void
|
|
queueproc(Schedq *rq, Proc *p)
|
|
{
|
|
int pri;
|
|
|
|
pri = rq - runq;
|
|
lock(&runq->l);
|
|
p->priority = pri;
|
|
p->rnext = 0;
|
|
if(rq->tail)
|
|
rq->tail->rnext = p;
|
|
else
|
|
rq->head = p;
|
|
rq->tail = p;
|
|
rq->n++;
|
|
nrdy++;
|
|
runvec |= 1<<pri;
|
|
unlock(&runq->l);
|
|
}
|
|
|
|
/*
|
|
* try to remove a process from a scheduling queue (called splhi)
|
|
*/
|
|
Proc*
|
|
dequeueproc(Schedq *rq, Proc *tp)
|
|
{
|
|
Proc *l, *p;
|
|
|
|
if(!canlock(&runq->l))
|
|
return nil;
|
|
|
|
/*
|
|
* the queue may have changed before we locked runq,
|
|
* refind the target process.
|
|
*/
|
|
l = 0;
|
|
for(p = rq->head; p; p = p->rnext){
|
|
if(p == tp)
|
|
break;
|
|
l = p;
|
|
}
|
|
|
|
/*
|
|
* p->mach==0 only when process state is saved
|
|
*/
|
|
if(p == 0 || p->mach){
|
|
unlock(&runq->l);
|
|
return nil;
|
|
}
|
|
if(p->rnext == 0)
|
|
rq->tail = l;
|
|
if(l)
|
|
l->rnext = p->rnext;
|
|
else
|
|
rq->head = p->rnext;
|
|
if(rq->head == nil)
|
|
runvec &= ~(1<<(rq-runq));
|
|
rq->n--;
|
|
nrdy--;
|
|
if(p->state != Ready)
|
|
jehanne_print("dequeueproc %s %d %s\n", p->text, p->pid, statename[p->state]);
|
|
|
|
unlock(&runq->l);
|
|
return p;
|
|
}
|
|
|
|
/*
|
|
* ready(p) picks a new priority for a process and sticks it in the
|
|
* runq for that priority.
|
|
*/
|
|
void
|
|
ready(Proc *p)
|
|
{
|
|
Mreg s;
|
|
int pri;
|
|
Schedq *rq;
|
|
void (*pt)(Proc*, int, int64_t, int64_t);
|
|
|
|
s = splhi();
|
|
|
|
if(up != p && (p->wired == nil || p->wired == m))
|
|
m->readied = p; /* group scheduling */
|
|
|
|
updatecpu(p);
|
|
pri = reprioritize(p);
|
|
p->priority = pri;
|
|
rq = &runq[pri];
|
|
p->state = Ready;
|
|
queueproc(rq, p);
|
|
pt = proctrace;
|
|
if(pt)
|
|
pt(p, SReady, 0, 0);
|
|
splx(s);
|
|
}
|
|
|
|
/*
|
|
* yield the processor and drop our priority
|
|
*/
|
|
void
|
|
yield(void)
|
|
{
|
|
if(anyready()){
|
|
/* pretend we just used 1/2 tick */
|
|
up->lastupdate -= Scaling/2;
|
|
sched();
|
|
}
|
|
}
|
|
|
|
/*
|
|
* recalculate priorities once a second. We need to do this
|
|
* since priorities will otherwise only be recalculated when
|
|
* the running process blocks.
|
|
*/
|
|
static void
|
|
rebalance(void)
|
|
{
|
|
Mreg s;
|
|
int pri, npri;
|
|
int64_t t;
|
|
Schedq *rq;
|
|
Proc *p;
|
|
|
|
t = m->ticks;
|
|
if(t - balancetime < HZ)
|
|
return;
|
|
balancetime = t;
|
|
|
|
for(pri=0, rq=runq; pri<Npriq; pri++, rq++){
|
|
another:
|
|
p = rq->head;
|
|
if(p == nil)
|
|
continue;
|
|
if(p->mp != m)
|
|
continue;
|
|
if(pri == p->basepri)
|
|
continue;
|
|
updatecpu(p);
|
|
npri = reprioritize(p);
|
|
if(npri != pri){
|
|
s = splhi();
|
|
p = dequeueproc(rq, p);
|
|
if(p)
|
|
queueproc(&runq[npri], p);
|
|
splx(s);
|
|
goto another;
|
|
}
|
|
}
|
|
}
|
|
|
|
/*
|
|
* pick a process to run
|
|
*/
|
|
Proc*
|
|
runproc(void)
|
|
{
|
|
Schedq *rq;
|
|
Proc *p;
|
|
uint64_t start, now;
|
|
int i;
|
|
void (*pt)(Proc*, int, int64_t, int64_t);
|
|
|
|
start = perfticks();
|
|
|
|
/* cooperative scheduling until the clock ticks */
|
|
if((p=m->readied) && p->mach==0 && p->state==Ready
|
|
&& (p->wired == nil || p->wired == m)
|
|
&& runq[Npriq-1].head == nil && runq[Npriq-2].head == nil){
|
|
skipscheds++;
|
|
rq = &runq[p->priority];
|
|
goto found;
|
|
}
|
|
|
|
preempts++;
|
|
|
|
loop:
|
|
/*
|
|
* find a process that last ran on this processor (affinity),
|
|
* or one that hasn't moved in a while (load balancing). Every
|
|
* time around the loop affinity goes down.
|
|
*/
|
|
spllo();
|
|
for(i = 0;; i++){
|
|
/*
|
|
* find the highest priority target process that this
|
|
* processor can run given affinity constraints.
|
|
*
|
|
*/
|
|
for(rq = &runq[Npriq-1]; rq >= runq; rq--){
|
|
for(p = rq->head; p; p = p->rnext){
|
|
if(p->mp == nil || p->mp == m
|
|
|| (!p->wired && i > 0))
|
|
goto found;
|
|
}
|
|
}
|
|
|
|
/* waste time or halt the CPU */
|
|
idlehands();
|
|
|
|
/* remember how much time we're here */
|
|
now = perfticks();
|
|
m->perf.inidle += now-start;
|
|
start = now;
|
|
}
|
|
|
|
found:
|
|
splhi();
|
|
p = dequeueproc(rq, p);
|
|
if(p == nil)
|
|
goto loop;
|
|
|
|
p->state = Scheding;
|
|
p->mp = m;
|
|
|
|
pt = proctrace;
|
|
if(pt)
|
|
pt(p, SRun, 0, 0);
|
|
return p;
|
|
}
|
|
|
|
void
|
|
pickmach(Proc *p)
|
|
{
|
|
Mach *mp;
|
|
int i;
|
|
|
|
if(sys->nmach < 2)
|
|
return;
|
|
for(;;){
|
|
i = (uint32_t)ainc(&machnoalloc)%sys->nmach;
|
|
mp = sys->machptr[i];
|
|
if(mp->online){
|
|
p->mp = mp;
|
|
return;
|
|
}
|
|
}
|
|
}
|
|
|
|
Proc*
|
|
newproc(void)
|
|
{
|
|
Proc *p;
|
|
|
|
p = psalloc();
|
|
|
|
p->state = Scheding;
|
|
p->inkernel = 0;
|
|
p->cursyscall = 0;
|
|
p->psstate = "New";
|
|
p->mach = 0;
|
|
p->qnext = 0;
|
|
p->nchild = 0;
|
|
p->nwait = 0;
|
|
p->waitq = 0;
|
|
p->parent = 0;
|
|
p->pgrp = 0;
|
|
p->egrp = 0;
|
|
p->fgrp = 0;
|
|
p->rgrp = 0;
|
|
p->pdbg = 0;
|
|
p->kp = 0;
|
|
if(up != nil && up->procctl == Proc_tracesyscall)
|
|
p->procctl = Proc_tracesyscall;
|
|
else
|
|
p->procctl = 0;
|
|
p->blockingfd = -1;
|
|
p->syscallq = nil;
|
|
p->notepending = 0;
|
|
p->notedeferred = 0;
|
|
p->ureg = 0;
|
|
p->privatemem = 0;
|
|
p->errstr = p->errbuf0;
|
|
p->syserrstr = p->errbuf1;
|
|
p->errbuf0[0] = '\0';
|
|
p->errbuf1[0] = '\0';
|
|
p->nlocks = 0;
|
|
p->delaysched = 0;
|
|
p->trace = 0;
|
|
kstrdup(&p->user, "*nouser");
|
|
kstrdup(&p->text, "*notext");
|
|
p->args = nil;
|
|
p->nargs = 0;
|
|
p->setargs = 0;
|
|
jehanne_memset(p->seg, 0, sizeof p->seg);
|
|
p->pid = incref(&pidalloc);
|
|
pshash(p);
|
|
p->noteid = incref(¬eidalloc);
|
|
if(p->pid <= 0 || p->noteid <= 0)
|
|
panic("pidalloc");
|
|
if(p->kstack == 0)
|
|
p->kstack = smalloc(KSTACK);
|
|
|
|
/* sched params */
|
|
p->mp = 0;
|
|
p->wired = 0;
|
|
procpriority(p, PriNormal, 0);
|
|
p->cpu = 0;
|
|
p->lastupdate = sys->ticks*Scaling;
|
|
|
|
return p;
|
|
}
|
|
|
|
/*
|
|
* wire this proc to a machine
|
|
*/
|
|
void
|
|
procwired(Proc *p, int bm)
|
|
{
|
|
Proc *pp;
|
|
int i;
|
|
char nwired[MACHMAX];
|
|
Mach *wm, *mp;
|
|
|
|
if(bm < 0){
|
|
/* pick a machine to wire to */
|
|
jehanne_memset(nwired, 0, sizeof(nwired));
|
|
p->wired = 0;
|
|
for(i=0; (pp = psincref(i)) != nil; i++){
|
|
wm = pp->wired;
|
|
if(wm && pp->pid)
|
|
nwired[wm->machno]++;
|
|
psdecref(pp);
|
|
}
|
|
bm = 0;
|
|
for(i=0; i<MACHMAX; i++){
|
|
if((mp = sys->machptr[i]) == nil || !mp->online)
|
|
continue;
|
|
if(nwired[i] < nwired[bm])
|
|
bm = i;
|
|
}
|
|
} else {
|
|
/* use the virtual machine requested */
|
|
bm = bm % MACHMAX;
|
|
}
|
|
|
|
p->wired = sys->machptr[bm];
|
|
p->mp = p->wired;
|
|
}
|
|
|
|
void
|
|
procpriority(Proc *p, int pri, int fixed)
|
|
{
|
|
if(pri >= Npriq)
|
|
pri = Npriq - 1;
|
|
else if(pri < 0)
|
|
pri = 0;
|
|
p->basepri = pri;
|
|
p->priority = pri;
|
|
if(fixed){
|
|
p->fixedpri = 1;
|
|
} else {
|
|
p->fixedpri = 0;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* sleep if a condition is not true. Another process will
|
|
* awaken us after it sets the condition. When we awaken
|
|
* the condition may no longer be true.
|
|
*
|
|
* we lock both the process and the rendezvous to keep r->p
|
|
* and p->r synchronized.
|
|
*/
|
|
void
|
|
sleep(Rendez *r, int (*f)(void*), void *arg)
|
|
{
|
|
Mreg s;
|
|
void (*pt)(Proc*, int, int64_t, int64_t);
|
|
|
|
s = splhi();
|
|
|
|
if(up->nlocks)
|
|
jehanne_print("process %d sleeps with %d locks held, last lock %#p locked at pc %#p, sleep called from %#p\n",
|
|
up->pid, up->nlocks, up->lastlock, lockgetpc(up->lastlock), getcallerpc());
|
|
lock(&r->l);
|
|
lock(&up->rlock);
|
|
if(r->p){
|
|
jehanne_print("double sleep called from %#p, %d %d\n",
|
|
getcallerpc(), r->p->pid, up->pid);
|
|
dumpstack();
|
|
}
|
|
|
|
/*
|
|
* Wakeup only knows there may be something to do by testing
|
|
* r->p in order to get something to lock on.
|
|
* Flush that information out to memory in case the sleep is
|
|
* committed.
|
|
*/
|
|
r->p = up;
|
|
|
|
awake_fell_asleep(up);
|
|
if((*f)(arg)
|
|
|| (up->notepending && !up->notedeferred)
|
|
|| (up->inkernel && awake_should_wake_up(up))){
|
|
/*
|
|
* if condition happened or a note is pending
|
|
* never mind
|
|
*/
|
|
r->p = nil;
|
|
unlock(&up->rlock);
|
|
unlock(&r->l);
|
|
} else {
|
|
/*
|
|
* now we are committed to
|
|
* change state and call scheduler
|
|
*/
|
|
pt = proctrace;
|
|
if(pt)
|
|
pt(up, SSleep, 0, 0);
|
|
up->state = Wakeme;
|
|
up->r = r;
|
|
|
|
/* statistics */
|
|
m->cs++;
|
|
|
|
procsave(up);
|
|
if(setlabel(&up->sched)) {
|
|
/*
|
|
* here when the process is awakened
|
|
*/
|
|
procrestore(up);
|
|
spllo();
|
|
} else {
|
|
/*
|
|
* here to go to sleep (i.e. stop Running)
|
|
*/
|
|
unlock(&up->rlock);
|
|
unlock(&r->l);
|
|
gotolabel(&m->sched);
|
|
}
|
|
}
|
|
|
|
if(up->notepending && !up->notedeferred) {
|
|
up->notepending = 0;
|
|
SleepAwakened:
|
|
splx(s);
|
|
interrupted();
|
|
}
|
|
if(up->inkernel && awake_should_wake_up(up)){
|
|
goto SleepAwakened;
|
|
}
|
|
|
|
splx(s);
|
|
}
|
|
|
|
void
|
|
interrupted(void)
|
|
{
|
|
if(up->procctl == Proc_exitme && up->closingfgrp != nil)
|
|
forceclosefgrp();
|
|
error(Eintr);
|
|
}
|
|
|
|
static int
|
|
tfn(void *arg)
|
|
{
|
|
return up->trend == nil || up->tfn(arg);
|
|
}
|
|
|
|
void
|
|
twakeup(Ureg* _, Timer *t)
|
|
{
|
|
Proc *p;
|
|
Rendez *trend;
|
|
|
|
ilock(&t->l);
|
|
p = t->ta;
|
|
trend = p->trend;
|
|
if(trend != nil){
|
|
wakeup(trend);
|
|
p->trend = nil;
|
|
}
|
|
iunlock(&t->l);
|
|
}
|
|
|
|
static void
|
|
stoptimer(void)
|
|
{
|
|
if(up->trend != nil || up->tt){
|
|
up->trend = nil;
|
|
timerdel(up);
|
|
}
|
|
}
|
|
|
|
void
|
|
tsleep(Rendez *r, int (*fn)(void*), void *arg, int64_t ms)
|
|
{
|
|
if (up->tt){
|
|
jehanne_print("%s %lud: tsleep timer active: mode %d, tf %#p, pc %#p\n",
|
|
up->text, up->pid, up->tmode, up->tf, __builtin_return_address(0));
|
|
timerdel(up);
|
|
}
|
|
up->tns = MS2NS(ms);
|
|
up->tf = twakeup;
|
|
up->tmode = Trelative;
|
|
up->ta = up;
|
|
up->trend = r;
|
|
up->tfn = fn;
|
|
timeradd(up);
|
|
|
|
if(waserror()){
|
|
stoptimer();
|
|
nexterror();
|
|
}
|
|
sleep(r, tfn, arg);
|
|
stoptimer();
|
|
poperror();
|
|
}
|
|
|
|
/*
|
|
* Expects that only one process can call wakeup for any given Rendez.
|
|
* We hold both locks to ensure that r->p and p->r remain consistent.
|
|
* Richard Miller has a better solution that doesn't require both to
|
|
* be held simultaneously, but I'm a paranoid - presotto.
|
|
*/
|
|
Proc*
|
|
wakeup(Rendez *r)
|
|
{
|
|
Mreg s;
|
|
Proc *p;
|
|
|
|
s = splhi();
|
|
|
|
lock(&r->l);
|
|
p = r->p;
|
|
|
|
if(p != nil){
|
|
lock(&p->rlock);
|
|
if(p->state != Wakeme || p->r != r)
|
|
panic("wakeup: state %d %d %d pc %#p", r->p != p, p->r != r, p->state, __builtin_return_address(0));
|
|
r->p = nil;
|
|
p->r = nil;
|
|
ready(p);
|
|
unlock(&p->rlock);
|
|
}
|
|
unlock(&r->l);
|
|
|
|
splx(s);
|
|
|
|
return p;
|
|
}
|
|
|
|
/*
|
|
* if waking a sleeping process, this routine must hold both
|
|
* p->rlock and r->lock. However, it can't know them in
|
|
* the same order as wakeup causing a possible lock ordering
|
|
* deadlock. We break the deadlock by giving up the p->rlock
|
|
* lock if we can't get the r->lock and retrying.
|
|
*/
|
|
int
|
|
postnote(Proc *p, int dolock, char *n, int flag)
|
|
{
|
|
Mreg s;
|
|
int ret;
|
|
Rendez *r;
|
|
|
|
if(dolock)
|
|
qlock(&p->debug);
|
|
|
|
if(flag != NUser && (p->notify == 0 || p->notified))
|
|
p->nnote = 0;
|
|
|
|
ret = 0;
|
|
if(p->nnote < NNOTE) {
|
|
jehanne_strcpy(p->note[p->nnote].msg, n);
|
|
p->note[p->nnote++].flag = flag;
|
|
ret = 1;
|
|
}
|
|
p->notepending = 1;
|
|
if(dolock)
|
|
qunlock(&p->debug);
|
|
|
|
if(p->notedeferred){
|
|
if(flag == NUser)
|
|
return ret;
|
|
/* do not defer fatal errors and kill through ctl */
|
|
p->notedeferred = 0;
|
|
}
|
|
|
|
/* this loop is to avoid lock ordering problems. */
|
|
for(;;){
|
|
s = splhi();
|
|
lock(&p->rlock);
|
|
r = p->r;
|
|
|
|
/* waiting for a wakeup? */
|
|
if(r == nil)
|
|
break; /* no */
|
|
|
|
/* try for the second lock */
|
|
if(canlock(&r->l)){
|
|
if(p->state != Wakeme || r->p != p)
|
|
panic("postnote: state %d %d %d", r->p != p, p->r != r, p->state);
|
|
p->r = nil;
|
|
r->p = nil;
|
|
ready(p);
|
|
unlock(&r->l);
|
|
break;
|
|
}
|
|
|
|
/* give other process time to get out of critical section and try again */
|
|
unlock(&p->rlock);
|
|
splx(s);
|
|
sched();
|
|
}
|
|
unlock(&p->rlock);
|
|
splx(s);
|
|
|
|
proc_interrupt_finalize(p);
|
|
return ret;
|
|
}
|
|
|
|
int
|
|
proc_interrupt_finalize(Proc *p)
|
|
{
|
|
QLock *q;
|
|
int done = 0;
|
|
switch(p->state){
|
|
default:
|
|
return 1;
|
|
case Queueing:
|
|
/* Try and pull out of a eqlock */
|
|
if((q = p->eql) != nil){
|
|
lock(&q->use);
|
|
if(p->state == Queueing && p->eql == q){
|
|
Proc *d, *l;
|
|
for(l = nil, d = q->head; d != nil; l = d, d = d->qnext){
|
|
if(d == p){
|
|
if(l != nil)
|
|
l->qnext = p->qnext;
|
|
else
|
|
q->head = p->qnext;
|
|
if(p->qnext == nil)
|
|
q->tail = l;
|
|
p->qnext = nil;
|
|
p->eql = nil; /* not taken */
|
|
ready(p);
|
|
done = 1;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
unlock(&q->use);
|
|
return done;
|
|
}
|
|
/* not an eqlock */
|
|
return 0;
|
|
case Rendezvous:
|
|
/* Try and pull out of a rendezvous */
|
|
lock(&p->rgrp->l);
|
|
if(p->state == Rendezvous) {
|
|
p->rendval = ~0;
|
|
if(p->rendtag == ~0){
|
|
/* In Jehanne the rendezvous point ~0
|
|
* is "private" to each process so
|
|
* it is not added to the rgrp (see sysrendezvous)
|
|
*/
|
|
ready(p);
|
|
done = 1;
|
|
goto RendezvousCompleted;
|
|
}
|
|
Proc *d, **l;
|
|
|
|
l = &REND(p->rgrp, p->rendtag);
|
|
for(d = *l; d != nil; d = d->rendhash) {
|
|
if(d == p) {
|
|
*l = p->rendhash;
|
|
p->rendval = ~0;
|
|
ready(p);
|
|
done = 1;
|
|
break;
|
|
}
|
|
l = &d->rendhash;
|
|
}
|
|
}
|
|
RendezvousCompleted:
|
|
unlock(&p->rgrp->l);
|
|
return done;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* prevent application notes within a control request that must complete
|
|
*/
|
|
void
|
|
notedefer(void)
|
|
{
|
|
int s;
|
|
|
|
s = splhi();
|
|
if(up->notedeferred)
|
|
panic("notedefer");
|
|
if(up->notepending){
|
|
up->notepending = 0;
|
|
splx(s);
|
|
error(Eintr);
|
|
}
|
|
up->notedeferred = 1;
|
|
splx(s);
|
|
}
|
|
|
|
void
|
|
noteallow(void)
|
|
{
|
|
up->notedeferred = 0;
|
|
/* trap or a later sleep will process the note */
|
|
}
|
|
|
|
/*
|
|
* weird thing: keep at most NBROKEN around
|
|
*/
|
|
#define NBROKEN 4
|
|
struct
|
|
{
|
|
QLock;
|
|
int n;
|
|
Proc *p[NBROKEN];
|
|
}broken;
|
|
|
|
void
|
|
addbroken(Proc *p)
|
|
{
|
|
qlock(&broken);
|
|
if(broken.n == NBROKEN) {
|
|
ready(broken.p[0]);
|
|
jehanne_memmove(&broken.p[0], &broken.p[1], sizeof(Proc*)*(NBROKEN-1));
|
|
--broken.n;
|
|
}
|
|
broken.p[broken.n++] = p;
|
|
qunlock(&broken);
|
|
|
|
dumpaproc(p);
|
|
dumpregs(p->dbgreg);
|
|
|
|
p->state = Broken;
|
|
p->psstate = 0;
|
|
sched();
|
|
}
|
|
|
|
void
|
|
unbreak(Proc *p)
|
|
{
|
|
int b;
|
|
|
|
qlock(&broken);
|
|
for(b=0; b < broken.n; b++)
|
|
if(broken.p[b] == p) {
|
|
broken.n--;
|
|
jehanne_memmove(&broken.p[b], &broken.p[b+1],
|
|
sizeof(Proc*)*(NBROKEN-(b+1)));
|
|
ready(p);
|
|
break;
|
|
}
|
|
qunlock(&broken);
|
|
}
|
|
|
|
int
|
|
freebroken(void)
|
|
{
|
|
int i, n;
|
|
|
|
qlock(&broken);
|
|
n = broken.n;
|
|
for(i=0; i<n; i++) {
|
|
ready(broken.p[i]);
|
|
broken.p[i] = 0;
|
|
}
|
|
broken.n = 0;
|
|
qunlock(&broken);
|
|
return n;
|
|
}
|
|
|
|
void
|
|
pexit(char *exitstr, int freemem)
|
|
{
|
|
Proc *p;
|
|
ProcSegment **s, **es;
|
|
long utime, stime;
|
|
Waitq *wq;
|
|
Fgrp *fgrp;
|
|
Egrp *egrp;
|
|
Rgrp *rgrp;
|
|
Pgrp *pgrp;
|
|
Chan *dot;
|
|
void (*pt)(Proc*, int, int64_t, int64_t);
|
|
|
|
up->alarm = 0;
|
|
up->blockingfd = -1;
|
|
awake_gc_proc(up);
|
|
if (up->tt)
|
|
timerdel(up);
|
|
pt = proctrace;
|
|
if(pt)
|
|
pt(up, SDead, 0, 0);
|
|
|
|
/* nil out all the resources under lock (free later) */
|
|
qlock(&up->debug);
|
|
fgrp = up->fgrp;
|
|
up->fgrp = nil;
|
|
egrp = up->egrp;
|
|
up->egrp = nil;
|
|
rgrp = up->rgrp;
|
|
up->rgrp = nil;
|
|
pgrp = up->pgrp;
|
|
up->pgrp = nil;
|
|
dot = up->dot;
|
|
up->dot = nil;
|
|
qunlock(&up->debug);
|
|
|
|
if(fgrp)
|
|
closefgrp(fgrp);
|
|
if(egrp)
|
|
closeegrp(egrp);
|
|
if(rgrp)
|
|
closergrp(rgrp);
|
|
if(dot)
|
|
cclose(dot);
|
|
if(pgrp)
|
|
closepgrp(pgrp);
|
|
|
|
/*
|
|
* if not a kernel process and have a parent,
|
|
* do some housekeeping.
|
|
*/
|
|
if(up->kp == 0) {
|
|
p = up->parent;
|
|
if(p == 0) {
|
|
if(exitstr == 0)
|
|
exitstr = "unknown";
|
|
panic("boot process died: %s", exitstr);
|
|
}
|
|
|
|
while(waserror())
|
|
;
|
|
|
|
wq = smalloc(sizeof(Waitq));
|
|
poperror();
|
|
|
|
wq->w.pid = up->pid;
|
|
utime = up->time[TUser] + up->time[TCUser];
|
|
stime = up->time[TSys] + up->time[TCSys];
|
|
wq->w.time[TUser] = tk2ms(utime);
|
|
wq->w.time[TSys] = tk2ms(stime);
|
|
wq->w.time[TReal] = tk2ms(sys->ticks - up->time[TReal]);
|
|
if(exitstr && exitstr[0])
|
|
jehanne_snprint(wq->w.msg, sizeof(wq->w.msg), "%s %d: %s",
|
|
up->text, up->pid, exitstr);
|
|
else
|
|
wq->w.msg[0] = '\0';
|
|
|
|
lock(&p->exl);
|
|
/*
|
|
* Check that parent is still alive.
|
|
*/
|
|
if(p->pid == up->parentpid && p->state != Broken) {
|
|
p->nchild--;
|
|
p->time[TCUser] += utime;
|
|
p->time[TCSys] += stime;
|
|
/*
|
|
* If there would be more than 2000 wait records
|
|
* processes for my parent, then don't leave a wait
|
|
* record behind. This helps prevent badly written
|
|
* daemon processes from accumulating lots of wait
|
|
* records.
|
|
*/
|
|
if(p->nwait < 2000) {
|
|
wq->next = p->waitq;
|
|
p->waitq = wq;
|
|
p->nwait++;
|
|
wq = nil;
|
|
wakeup(&p->waitr);
|
|
}
|
|
}
|
|
unlock(&p->exl);
|
|
if(wq)
|
|
jehanne_free(wq);
|
|
}
|
|
|
|
if(!freemem)
|
|
addbroken(up);
|
|
|
|
wlock(&up->seglock);
|
|
es = &up->seg[NSEG];
|
|
for(s = up->seg; s < es; s++) {
|
|
if(*s)
|
|
segment_release(s);
|
|
}
|
|
wunlock(&up->seglock);
|
|
|
|
lock(&up->exl); /* Prevent my children from leaving waits */
|
|
psunhash(up);
|
|
up->pid = 0;
|
|
wakeup(&up->waitr);
|
|
unlock(&up->exl);
|
|
|
|
while((wq = up->waitq) != nil){
|
|
up->waitq = wq->next;
|
|
jehanne_free(wq);
|
|
}
|
|
|
|
/* release debuggers */
|
|
qlock(&up->debug);
|
|
if(up->syscallq != nil){
|
|
qhangup(up->syscallq, nil);
|
|
up->syscallq = nil;
|
|
}
|
|
if(up->pdbg) {
|
|
wakeup(&up->pdbg->sleep);
|
|
up->pdbg = 0;
|
|
}
|
|
qunlock(&up->debug);
|
|
|
|
/* Sched must not loop for these locks */
|
|
lock(&procalloc.l);
|
|
|
|
up->state = Moribund;
|
|
sched();
|
|
panic("pexit");
|
|
}
|
|
|
|
int
|
|
haswaitq(void *x)
|
|
{
|
|
Proc *p;
|
|
|
|
p = (Proc *)x;
|
|
return p->waitq != 0;
|
|
}
|
|
|
|
int
|
|
pwait(Waitmsg *w)
|
|
{
|
|
int cpid;
|
|
Waitq *wq;
|
|
|
|
if(!canqlock(&up->qwaitr))
|
|
error(Einuse);
|
|
|
|
if(waserror()) {
|
|
qunlock(&up->qwaitr);
|
|
nexterror();
|
|
}
|
|
|
|
lock(&up->exl);
|
|
while(up->waitq == nil) {
|
|
if(up->nchild == 0) {
|
|
unlock(&up->exl);
|
|
error(Enochild);
|
|
}
|
|
unlock(&up->exl);
|
|
sleep(&up->waitr, haswaitq, up);
|
|
lock(&up->exl);
|
|
}
|
|
wq = up->waitq;
|
|
up->waitq = wq->next;
|
|
up->nwait--;
|
|
unlock(&up->exl);
|
|
|
|
qunlock(&up->qwaitr);
|
|
poperror();
|
|
|
|
if(w != nil)
|
|
jehanne_memmove(w, &wq->w, sizeof(Waitmsg));
|
|
cpid = wq->w.pid;
|
|
jehanne_free(wq);
|
|
|
|
return cpid;
|
|
}
|
|
|
|
void
|
|
dumpaproc(Proc *p)
|
|
{
|
|
uintptr_t bss;
|
|
char *s;
|
|
|
|
if(p == 0)
|
|
return;
|
|
|
|
bss = 0;
|
|
rlock(&p->seglock);
|
|
if(p->seg[BSEG])
|
|
bss = p->seg[BSEG]->top;
|
|
runlock(&p->seglock);
|
|
|
|
s = p->psstate;
|
|
if(s == 0)
|
|
s = statename[p->state];
|
|
jehanne_print("%3d:%10s %#p pc %#p dbgpc %#p %8s (%s) ut %ld st %ld bss %#p qpc %#p nl %d nd %lud lpc %#p pri %lud wkps %d/%d[%#p,%#p]\n",
|
|
p->pid, p->text, p, p->pc, dbgpc(p), s, statename[p->state],
|
|
p->time[0], p->time[1], bss, p->qpc, p->nlocks,
|
|
p->delaysched, p->lastlock ? lockgetpc(p->lastlock) : 0, p->priority,
|
|
p->wakeups[0].count, p->wakeups[1].count, p->wakeups[0].elapsed, p->wakeups[1].elapsed
|
|
);
|
|
}
|
|
|
|
void
|
|
procdump(void)
|
|
{
|
|
int i;
|
|
Proc *p;
|
|
|
|
if(up)
|
|
jehanne_print("up %d\n", up->pid);
|
|
else
|
|
jehanne_print("no current process\n");
|
|
for(i=0; (p = psincref(i)) != nil; i++) {
|
|
if(p->state != Dead)
|
|
dumpaproc(p);
|
|
psdecref(p);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* must be called in trap, at least on clock interrupt,
|
|
* to check and clear the flushmmu flag set above
|
|
*/
|
|
void
|
|
checkflushmmu(void)
|
|
{
|
|
if(m->mmuflush){
|
|
if(up)
|
|
mmuflush();
|
|
m->mmuflush = 0;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* wait till all processes have flushed their mmu
|
|
* state about the given segment
|
|
*/
|
|
void
|
|
procs_flush_segment(ProcSegment *s)
|
|
{
|
|
int i, ns, nm, nwait;
|
|
Proc *p;
|
|
Mach *mp;
|
|
|
|
/*
|
|
* tell all processes with the same set
|
|
* of pages to flush their mmus
|
|
*/
|
|
nwait = 0;
|
|
for(i=0; (p = psincref(i)) != nil; i++) {
|
|
if(p->state == Dead){
|
|
psdecref(p);
|
|
continue;
|
|
}
|
|
if(p != up)
|
|
rlock(&p->seglock);
|
|
for(ns = 0; ns < NSEG; ns++){
|
|
if(p->seg[ns] == s){
|
|
p->newtlb = 1;
|
|
for(nm = 0; nm < MACHMAX; nm++){
|
|
if((mp = sys->machptr[nm]) == nil || !mp->online)
|
|
continue;
|
|
if(mp->proc == p){
|
|
mp->mmuflush = 1;
|
|
nwait++;
|
|
}
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
if(p != up)
|
|
runlock(&p->seglock);
|
|
psdecref(p);
|
|
}
|
|
|
|
if(nwait == 0)
|
|
return;
|
|
|
|
/*
|
|
* wait for all processors to take a clock interrupt
|
|
* and flush their mmu's
|
|
*/
|
|
for(i = 0; i < MACHMAX; i++){
|
|
if((mp = sys->machptr[i]) == nil || !mp->online || mp == m)
|
|
continue;
|
|
while(mp->mmuflush)
|
|
sched();
|
|
}
|
|
}
|
|
|
|
void
|
|
scheddump(void)
|
|
{
|
|
Proc *p;
|
|
Schedq *rq;
|
|
|
|
for(rq = &runq[Npriq-1]; rq >= runq; rq--){
|
|
if(rq->head == 0)
|
|
continue;
|
|
jehanne_print("rq%ld:", rq-runq);
|
|
for(p = rq->head; p; p = p->rnext)
|
|
jehanne_print(" %d(%llud)", p->pid, m->ticks - p->readytime);
|
|
jehanne_print("\n");
|
|
delay(150);
|
|
}
|
|
jehanne_print("nrdy %d\n", nrdy);
|
|
}
|
|
|
|
void
|
|
kproc(char *name, void (*func)(void *), void *arg)
|
|
{
|
|
Proc *p;
|
|
static Pgrp *kpgrp;
|
|
|
|
while(waserror())
|
|
{}
|
|
p = newproc();
|
|
poperror();
|
|
|
|
p->psstate = 0;
|
|
p->procmode = 0640;
|
|
p->kp = 1;
|
|
|
|
p->scallnr = up->scallnr;
|
|
jehanne_memmove(p->arg, up->arg, sizeof(up->arg));
|
|
p->nerrlab = 0;
|
|
p->slash = up->slash;
|
|
p->dot = up->dot;
|
|
if(p->dot)
|
|
incref(&p->dot->r);
|
|
|
|
jehanne_memmove(p->note, up->note, sizeof(p->note));
|
|
p->nnote = up->nnote;
|
|
p->notified = 0;
|
|
p->lastnote = up->lastnote;
|
|
p->notify = up->notify;
|
|
p->ureg = 0;
|
|
p->dbgreg = 0;
|
|
|
|
procpriority(p, PriKproc, 0);
|
|
|
|
kprocchild(p, func, arg);
|
|
|
|
kstrdup(&p->user, eve);
|
|
kstrdup(&p->text, name);
|
|
if(kpgrp == 0)
|
|
kpgrp = newpgrp();
|
|
p->pgrp = kpgrp;
|
|
incref(&kpgrp->r);
|
|
|
|
jehanne_memset(p->time, 0, sizeof(p->time));
|
|
p->time[TReal] = sys->ticks;
|
|
// pickmach(p);
|
|
ready(p);
|
|
}
|
|
|
|
/*
|
|
* called splhi() by notify(). See comment in notify for the
|
|
* reasoning.
|
|
*/
|
|
void
|
|
procctl(Proc *p)
|
|
{
|
|
Mreg s;
|
|
char *state;
|
|
|
|
switch(p->procctl) {
|
|
case Proc_exitbig:
|
|
spllo();
|
|
pexit("Killed: Insufficient physical memory", 1);
|
|
|
|
case Proc_exitme:
|
|
spllo(); /* pexit has locks in it */
|
|
pexit("Killed", 1);
|
|
|
|
case Proc_traceme:
|
|
if(p->nnote == 0)
|
|
return;
|
|
/* No break */
|
|
|
|
case Proc_stopme:
|
|
p->procctl = 0;
|
|
state = p->psstate;
|
|
p->psstate = "Stopped";
|
|
/* free a waiting debugger */
|
|
s = spllo();
|
|
qlock(&p->debug);
|
|
if(p->pdbg) {
|
|
wakeup(&p->pdbg->sleep);
|
|
p->pdbg = 0;
|
|
}
|
|
qunlock(&p->debug);
|
|
splhi();
|
|
p->state = Stopped;
|
|
sched();
|
|
p->psstate = state;
|
|
splx(s);
|
|
return;
|
|
}
|
|
}
|
|
|
|
void
|
|
errorf(char *fmt, ...)
|
|
{
|
|
va_list arg;
|
|
char buf[PRINTSIZE];
|
|
|
|
va_start(arg, fmt);
|
|
jehanne_vseprint(buf, buf+sizeof(buf), fmt, arg);
|
|
va_end(arg);
|
|
error(buf);
|
|
}
|
|
|
|
void
|
|
error(char *err)
|
|
{
|
|
errorl(err, -1);
|
|
}
|
|
|
|
void
|
|
errorl(char *err, long syscallerr)
|
|
{
|
|
if(up == nil)
|
|
panic("errorl(%s, %lld) not in a process", err, syscallerr);
|
|
spllo();
|
|
|
|
if(up->nerrlab >= NERR)
|
|
panic("error stack too deep");
|
|
up->syscallerr = syscallerr;
|
|
if(err != nil)
|
|
kstrcpy(up->errstr, err, ERRMAX);
|
|
setlabel(&up->errlab[NERR-1]);
|
|
nexterror();
|
|
}
|
|
|
|
void
|
|
nexterror(void)
|
|
{
|
|
if(up->nerrlab <= 0)
|
|
labtrap("nexterror");
|
|
gotolabel(&up->errlab[--up->nerrlab]);
|
|
}
|
|
|
|
int
|
|
labtrap(char *source)
|
|
{
|
|
static Lock l;
|
|
int i;
|
|
|
|
ilock(&l);
|
|
jehanne_print("labtrap (%s):\n", source);
|
|
for (i=NERR-1; i>=0; i--)
|
|
if (up->errlab[i].pc)
|
|
jehanne_print("%d: sp=%#p pc=%#p\n", i, up->errlab[i].sp, up->errlab[i].pc);
|
|
iunlock(&l);
|
|
delay(3*1000); /* delay to let cons queue drain */
|
|
panic(source);
|
|
return 1;
|
|
}
|
|
|
|
void
|
|
labassert(int nerrlab)
|
|
{
|
|
if (up->nerrlab != nerrlab)
|
|
labtrap("labassert");
|
|
}
|
|
|
|
void
|
|
exhausted(char *resource)
|
|
{
|
|
char buf[ERRMAX];
|
|
|
|
jehanne_sprint(buf, "no free %s", resource);
|
|
iprint("%s\n", buf);
|
|
error(buf);
|
|
}
|
|
|
|
/*
|
|
* neither p nor its segments are necessarily locked
|
|
*/
|
|
uint32_t
|
|
procdatasize(Proc *p, int addstack)
|
|
{
|
|
ProcSegment *s;
|
|
uint32_t tot, l;
|
|
int i, n;
|
|
|
|
tot = 0;
|
|
for(i = 1; i < NSEG; i++){
|
|
s = p->seg[i];
|
|
if(s != nil && (i != SSEG || addstack)){
|
|
l = s->top - s->base;
|
|
n = s->r.ref;
|
|
if(n > 1)
|
|
l /= n;
|
|
if(p->seg[i] == s) /* ie, hasn't changed meanwhile */
|
|
tot += l;
|
|
}
|
|
}
|
|
return tot;
|
|
}
|
|
|
|
int
|
|
cankillproc(Proc *p)
|
|
{
|
|
if(p->kp)
|
|
return 0;
|
|
if(p->state == Dead || p->state == Moribund)
|
|
return 0;
|
|
if(p->procctl == Proc_exitbig || p->procctl == Proc_exitme)
|
|
return 0;
|
|
return jehanne_strcmp(p->user, eve) != 0 || (p->procmode&0222) != 0;
|
|
}
|
|
|
|
enum{
|
|
Nbig= 8
|
|
};
|
|
|
|
static uint32_t
|
|
findbignoteid(void)
|
|
{
|
|
int i, nbig;
|
|
uint32_t l, noteid, noteids[Nbig], sizes[Nbig], t;
|
|
Proc *p;
|
|
int j;
|
|
|
|
jehanne_memset(sizes, 0, sizeof(sizes));
|
|
jehanne_memset(noteids, 0, sizeof(noteids));
|
|
nbig = 0;
|
|
for(j = 0; (p = psincref(j)) != nil; j++){
|
|
if(cankillproc(p)){
|
|
noteid = p->noteid;
|
|
l = procdatasize(p, 1);
|
|
if(l < 4*MB)
|
|
continue;
|
|
for(i = 0; i < nbig; i++){
|
|
if(noteid == noteids[i]){
|
|
if(l > sizes[i])
|
|
sizes[i] = l;
|
|
break;
|
|
}
|
|
if(l > sizes[i]){
|
|
t = noteids[i]; noteids[i] = noteid; noteid = t;
|
|
t = sizes[i]; sizes[i] = l; l = t;
|
|
}
|
|
}
|
|
if(i == nbig && nbig < nelem(noteids)){
|
|
noteids[nbig] = noteid;
|
|
sizes[nbig] = l;
|
|
nbig++;
|
|
}
|
|
}
|
|
psdecref(p);
|
|
}
|
|
noteid = 0;
|
|
l = 0;
|
|
for(i = 0; i < nbig; i++){
|
|
if(noteids[i] > noteid && sizes[i] > l/2){
|
|
noteid = noteids[i];
|
|
l = sizes[i];
|
|
}
|
|
}
|
|
return noteid;
|
|
}
|
|
|
|
void
|
|
killbig(char *why)
|
|
{
|
|
uint32_t noteid;
|
|
Proc *p;
|
|
int i;
|
|
|
|
noteid = findbignoteid();
|
|
if(noteid == 0)
|
|
return;
|
|
for(i = 0; (p = psincref(i)) != nil; i++){
|
|
if(p->noteid == noteid && canqlock(&p->debug)){
|
|
if(p->noteid == noteid && cankillproc(p)){
|
|
jehanne_print("%ud: %s killed: %s\n", p->pid, p->text, why);
|
|
prockill(p, Proc_exitbig, why);
|
|
}
|
|
qunlock(&p->debug);
|
|
}
|
|
psdecref(p);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* must hold the lock p->debug
|
|
*/
|
|
void
|
|
prockill(Proc *p, int ctl, char *why)
|
|
{
|
|
switch(p->state) {
|
|
case Broken:
|
|
unbreak(p);
|
|
break;
|
|
case Stopped:
|
|
p->procctl = ctl;
|
|
postnote(p, 0, why, NExit);
|
|
ready(p);
|
|
break;
|
|
default:
|
|
p->procctl = ctl;
|
|
postnote(p, 0, why, NExit);
|
|
break;
|
|
}
|
|
}
|
|
|
|
/*
|
|
* change ownership to 'new' of all processes owned by 'old'. Used when
|
|
* eve changes.
|
|
*/
|
|
void
|
|
renameuser(char *old, char *new)
|
|
{
|
|
int i;
|
|
Proc *p;
|
|
|
|
for(i = 0; (p = psincref(i)) != nil; i++){
|
|
if(p->user!=nil && jehanne_strcmp(old, p->user)==0)
|
|
kstrdup(&p->user, new);
|
|
psdecref(p);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* time accounting called by clock() splhi'd
|
|
*/
|
|
void
|
|
accounttime(void)
|
|
{
|
|
Proc *p;
|
|
uint64_t n, per;
|
|
static uint32_t nrun;
|
|
|
|
p = m->proc;
|
|
if(p) {
|
|
nrun++;
|
|
p->time[p->inkernel]++;
|
|
}
|
|
|
|
/* calculate decaying duty cycles */
|
|
n = perfticks();
|
|
per = n - m->perf.last;
|
|
m->perf.last = n;
|
|
per = (m->perf.period*(HZ-1) + per)/HZ;
|
|
if(per != 0)
|
|
m->perf.period = per;
|
|
|
|
m->perf.avg_inidle = (m->perf.avg_inidle*(HZ-1)+m->perf.inidle)/HZ;
|
|
m->perf.inidle = 0;
|
|
|
|
m->perf.avg_inintr = (m->perf.avg_inintr*(HZ-1)+m->perf.inintr)/HZ;
|
|
m->perf.inintr = 0;
|
|
|
|
/* only one processor gets to compute system load averages */
|
|
if(m->machno != 0)
|
|
return;
|
|
|
|
/*
|
|
* calculate decaying load average.
|
|
* if we decay by (n-1)/n then it takes
|
|
* n clock ticks to go from load L to .36 L once
|
|
* things quiet down. it takes about 5 n clock
|
|
* ticks to go to zero. so using HZ means this is
|
|
* approximately the load over the last second,
|
|
* with a tail lasting about 5 seconds.
|
|
*/
|
|
n = nrun;
|
|
nrun = 0;
|
|
n = (nrdy+n)*1000;
|
|
m->load = (m->load*(HZ-1)+n)/HZ;
|
|
}
|
|
|