MIT 6.S081入门lab7 多线程
1.xv6 book书籍阅读(Chapter 7: Scheduling through Section 7.4)
- 核心问题:
- 如何安全的完成进程切换
- 切换需要透明+强制->时钟中断的轮转调度机制
- 考虑CPU的并发性->需要锁机制
- 进程资源的释放(注意内核相关资源的实现)
- 系统调用的解决->cpu需要了解当前执行进程是哪一个
- sleep和wakeup机制带来的唤醒丢失(lost wakeup)问题
调度核心思想: 保存上下文,选择进程,恢复状态,执行进程
xv6的区别: xv6核心是针对内核线程进行调度,其调度核心是每个CPU的调度线程,内核态上下文是用户态的子集
核心函数 swtch(a0, a1)(kernel/swtch.S): 把当前内核上下文保存到a0指向的结构中,并从a1指向的结构中恢复上下文;其通过切换返回地址寄存器ra和栈指针寄存器sp实现了内核线程的切换;
注: swtch只保存被调用者保存的寄存器(Callee-saved registers);调用者保存的寄存器(Caller-saved registers)由调用者保存在自己的内核栈上,具体寄存器可以查询lab4的risc-v寄存器章节。
xv6调度的完整流程: 用户进程PA->usertrap->内核线程TA->yield(TA)->sched(TA)->swtch(TA, S)->调度线程S->swtch(S, TB)->sched(TB)->yield(TB)->内核线程TB->usertrapret->用户进程PB
# Context switch
#
#   void swtch(struct context *old, struct context *new);
#
# Save current registers in old. Load from new.
#
# Only ra, sp and s0-s11 are stored and reloaded here. The final ret
# jumps to the ra value that was just loaded from new.

.globl swtch
swtch:
        # Store the current ra, sp and s0-s11 into *old (a0).
        sd ra, 0(a0)
        sd sp, 8(a0)
        sd s0, 16(a0)
        sd s1, 24(a0)
        sd s2, 32(a0)
        sd s3, 40(a0)
        sd s4, 48(a0)
        sd s5, 56(a0)
        sd s6, 64(a0)
        sd s7, 72(a0)
        sd s8, 80(a0)
        sd s9, 88(a0)
        sd s10, 96(a0)
        sd s11, 104(a0)

        # Load ra, sp and s0-s11 from *new (a1), using the same offsets.
        ld ra, 0(a1)
        ld sp, 8(a1)
        ld s0, 16(a1)
        ld s1, 24(a1)
        ld s2, 32(a1)
        ld s3, 40(a1)
        ld s4, 48(a1)
        ld s5, 56(a1)
        ld s6, 64(a1)
        ld s7, 72(a1)
        ld s8, 80(a1)
        ld s9, 88(a1)
        ld s10, 96(a1)
        ld s11, 104(a1)

        ret
3. 代码:调度线程
需要调度线程的原因: 如果在旧线程的内核栈上运行调度器,其他CPU可能同时运行该线程,导致两个CPU使用同一个内核栈;因此,每个CPU只能在自己的调度线程栈上运行调度器;
调度流程: 时钟中断陷入trap后,which_dev == 2,usertrap调用yield函数开始调度
yield: 获得进程锁,修改状态,调用sched();
yield kernel/proc.c:521
// Give up the CPU for one scheduling round. void yield(void) { struct proc *p = myproc(); acquire(&p->lock); p->state = RUNNABLE; sched(); release(&p->lock); }
sched: 检查p->lock和其他的锁(通过检查中断嵌套层数),检查进程状态+中断状态, 调取mycpu,使用swtch切换进入cpu线程(调度线程)
sched kernel/proc.c:494
// Switch to scheduler. Must hold only p->lock // and have changed proc->state. Saves and restores // intena because intena is a property of this // kernel thread, not this CPU. It should // be proc->intena and proc->noff, but that would // break in the few places where a lock is held but // there's no process. void sched(void) { int intena; struct proc *p = myproc(); if(!holding(&p->lock)) panic("sched p->lock"); if(mycpu()->noff != 1) panic("sched locks"); if(p->state == RUNNING) panic("sched running"); if(intr_get()) panic("sched interruptible"); intena = mycpu()->intena; swtch(&p->context, &mycpu()->context); mycpu()->intena = intena; }
scheduler: 使用循环寻找下一个需要执行的内核线程,并设定状态和运行空间,同时使用swtch切换回到内核线程的sched
scheduler kernel/proc.c
/ Per-CPU process scheduler. // Each CPU calls scheduler() after setting itself up. // Scheduler never returns. It loops, doing: // - choose a process to run. // - swtch to start running that process. // - eventually that process transfers control // via swtch back to the scheduler. void scheduler(void) { struct proc *p; struct cpu *c = mycpu(); c->proc = 0; for(;;){ // Avoid deadlock by ensuring that devices can interrupt. intr_on(); int nproc = 0; for(p = proc; p < &proc[NPROC]; p++) { acquire(&p->lock); if(p->state != UNUSED) { nproc++; } if(p->state == RUNNABLE) { // Switch to chosen process. It is the process's job // to release its lock and then reacquire it // before jumping back to us. p->state = RUNNING; c->proc = p; swtch(&c->context, &p->context); // Process is done running for now. // It should have changed its p->state before coming back. c->proc = 0; } release(&p->lock); } if(nproc <= 2) { // only init and sh exist intr_on(); asm volatile("wfi"); } } }
核心: sched和scheduler表现为一对协程(coroutine): 各内核线程的sched与调度线程的scheduler通过swtch相互切换
例外: 进程创建时,在allocproc中将context.ra设置为forkret,因此第一次被调度时swtch会返回到forkret,再由forkret直接返回到用户空间中。
allocproc kernel/proc.c
// Look in the process table for an UNUSED proc. // If found, initialize state required to run in the kernel, // and return with p->lock held. // If there are no free procs, or a memory allocation fails, return 0. static struct proc* allocproc(void) { struct proc *p; for(p = proc; p < &proc[NPROC]; p++) { acquire(&p->lock); if(p->state == UNUSED) { goto found; } else { release(&p->lock); } } return 0; found: p->pid = allocpid(); // Allocate a trapframe page. if((p->trapframe = (struct trapframe *)kalloc()) == 0){ release(&p->lock); return 0; } // An empty user page table. p->pagetable = proc_pagetable(p); if(p->pagetable == 0){ freeproc(p); release(&p->lock); return 0; } // Set up new context to start executing at forkret, // which returns to user space. memset(&p->context, 0, sizeof(p->context)); p->context.ra = (uint64)forkret; //调用forkret p->context.sp = p->kstack + PGSIZE; return p; }
forkret kernel/proc.c
// A fork child's very first scheduling by scheduler() // will swtch to forkret. void forkret(void) { static int first = 1; // Still holding p->lock from scheduler. release(&myproc()->lock); if (first) { // File system initialization must be run in the context of a // regular process (e.g., because it calls sleep), and thus cannot // be run from main(). first = 0; fsinit(ROOTDEV); } usertrapret();//直接返回用户空间 }
p->lock的保护: 在调度过程完成之前,保持该内核栈不被其他CPU运行
- 改变进程状态为RUNNABLE,防止进程状态的不一致。
- swtch发生的上下文切换,防止保存和恢复寄存器不完整。
- 停止使用当前内核线程的内核栈,因此防止两个CPU使用同一个内核栈。
- 其他:exit和wait之间的交互,避免唤醒丢失,进程在exit时产生的竞争条件等。
4.代码 Mycpu 和 Myproc
- 多cpu维护当前cpu运行进程的解决方案: 使用每个cpu的寄存器集合;
struct cpu结构保存了进程结构、调度上下文、中断信息;
struct cpu kernel/proc.h
// Per-CPU state. struct cpu { struct proc *proc; // The process running on this cpu, or null. struct context context; // swtch() here to enter scheduler(). int noff; // Depth of push_off() nesting. int intena; // Were interrupts enabled before push_off()? }; extern struct cpu cpus[NCPU];
r_tp kernel/riscv.h
// read and write tp, the thread pointer, which holds // this core's hartid (core number), the index into cpus[]. static inline uint64 r_tp() { uint64 x; asm volatile("mv %0, tp" : "=r" (x) ); return x; }
mycpu,cpuid kernel/proc.c
// Must be called with interrupts disabled, // to prevent race with process being moved // to a different CPU. int cpuid() { int id = r_tp(); return id; } // Return this CPU's cpu struct. // Interrupts must be disabled. struct cpu* mycpu(void) { int id = cpuid(); struct cpu *c = &cpus[id]; return c; }
myproc kernel/proc.c
// Return the current struct proc *, or zero if none. struct proc* myproc(void) { push_off(); struct cpu *c = mycpu(); struct proc *p = c->proc; pop_off(); return p; }
二、涉及函数(kernel/proc.c, kernel/swtch.S)
三、课程视频观看笔记(lec 11)
- 线程切换: 需求:多任务处理+线程加速
- 线程: 一种串行执行方式;
- 重要状态:PC、寄存器、堆栈;
- 需求:交错执行;线程切换。
- 如果共享内存时,需要锁
- xv6中,每一个用户进程有着相对应的内核线程(代表该进程执行系统调用),同时每个用户进程只有一个用户线程
- 多任务的其他解决方式:状态机、事件驱动编程。
- 线程的挑战: 进程的切换+调度+保存和恢复+计算密集型线程的处理
- 处理方案:
- 定时器中断划分时间->内核获取控制权->内核调度(用户态抢占型调度,内核态自愿性调度)
- 进程状态:运行、可运行、睡眠
- 需要保存的数据:CPU运行状态:PC+寄存器;
- 用户态进程调度的核心: 内核线程的切换,即内核栈的切换;
- 每个内核CPU都有自己的堆栈,在entry.S中初始化
- 注意: 每个核心在同一时刻只运行一个线程
- swtch调换机制: swtch通过ra和sp进行调换,同时,可以通过sp和ra判断当前程序,如果在非常前的地址,则是在cpu的初始化栈中。
- p->lock 的机制: 在yield中上锁,scheduler中释放/在scheduler上锁, yield中释放,保证启动和切换一个进程的过程是原子的。
- 进程切换的核心代码:swtch,把线程易变的执行状态(即cpu的相应寄存器)保存到内存中,并从内存中恢复另一个线程的寄存器
- linux线程:核心是共享内存的进程;
Uthread: switching between threads
... // Saved registers for user context switches. 上下文结构体 struct context { uint64 ra; uint64 sp; // callee-saved uint64 s0; uint64 s1; uint64 s2; uint64 s3; uint64 s4; uint64 s5; uint64 s6; uint64 s7; uint64 s8; uint64 s9; uint64 s10; uint64 s11; }; struct thread { char stack[STACK_SIZE]; /* the thread's stack */ int state; /* FREE, RUNNING, RUNNABLE */ struct context context; /*context struct to save callee reg*/ }; ... void thread_schedule(void) { /* YOUR CODE HERE * Invoke thread_switch to switch from t to next_thread: * thread_switch(??, ??); */ thread_switch((uint64)&(t->context), (uint64)&(next_thread->context)); //调用switch函数切换栈和ra,并保存callee寄存器 } else next_thread = 0; } ... void thread_create(void (*func)()) { t->state = RUNNABLE; // YOUR CODE HERE t->context.ra = (uint64)func; //return to the func addr t->context.sp = (uint64)((char *)&t->stack + (STACK_SIZE - 1)); //保存栈信息(从高往低生长) }
.text

/*
 * save the old thread's registers,
 * restore the new thread's registers.
 */

// void thread_switch(struct context *old, struct context *new);
.globl thread_switch
thread_switch:
        /* YOUR CODE HERE */
        /* store the current ra, sp and s0-s11 into *old (a0) */
        sd ra, 0(a0)
        sd sp, 8(a0)
        sd s0, 16(a0)
        sd s1, 24(a0)
        sd s2, 32(a0)
        sd s3, 40(a0)
        sd s4, 48(a0)
        sd s5, 56(a0)
        sd s6, 64(a0)
        sd s7, 72(a0)
        sd s8, 80(a0)
        sd s9, 88(a0)
        sd s10, 96(a0)
        sd s11, 104(a0)

        /* load ra, sp and s0-s11 from *new (a1), same offsets */
        ld ra, 0(a1)
        ld sp, 8(a1)
        ld s0, 16(a1)
        ld s1, 24(a1)
        ld s2, 32(a1)
        ld s3, 40(a1)
        ld s4, 48(a1)
        ld s5, 56(a1)
        ld s6, 64(a1)
        ld s7, 72(a1)
        ld s8, 80(a1)
        ld s9, 88(a1)
        ld s10, 96(a1)
        ld s11, 104(a1)

        ret    /* return to ra */
# Add the uthread program to the UPROGS list.
UPROGS=\
	...
	$U/_uthread\
Using threads
...
int nthread = 1;
pthread_mutex_t lock[NBUCKET]; // one mutex per bucket, indexed by key % NBUCKET
...
static
void put(int key, int value)
{
  int i = key % NBUCKET;
  pthread_mutex_lock(&lock[i]);   // lock the bucket this key maps to
  ...
  pthread_mutex_unlock(&lock[i]); // unlock the bucket
}

static struct entry*
get(int key)
{
  int i = key % NBUCKET;
  pthread_mutex_lock(&lock[i]);   // lock the bucket this key maps to
  ...
  pthread_mutex_unlock(&lock[i]); // unlock the bucket
  return e;
}
...
int
main(int argc, char *argv[])
{
  ...
  for (int i = 0; i < NKEYS; i++) {
    keys[i] = random();
  }
  for (int i = 0; i < NBUCKET; i++) {
    pthread_mutex_init(&lock[i], NULL); // initialize each bucket's mutex
  }
  //
  // first the puts
  //
}
static void barrier() { // YOUR CODE HERE //if thread enter the barrier , add nthread and check if nthread == nthread wake and round++else sleep pthread_mutex_lock(&bstate.barrier_mutex); if (++bstate.nthread < nthread) { pthread_cond_wait(&bstate.barrier_cond, &bstate.barrier_mutex); } else { bstate.nthread = 0; bstate.round++; pthread_cond_broadcast(&bstate.barrier_cond); } pthread_mutex_unlock(&bstate.barrier_mutex); // Block until all threads have called barrier() and // then increment bstate.round. // }
