DragonOS/kernel/process/process.c

1131 lines
34 KiB
C
Raw Normal View History

#include "process.h"
#include <common/printk.h>
#include <common/kprint.h>
2022-05-03 07:40:23 +00:00
#include <common/stdio.h>
2022-07-18 08:07:34 +00:00
#include <common/compiler.h>
2022-05-18 10:27:00 +00:00
#include <common/libELF/elf.h>
2022-07-27 13:19:59 +00:00
#include <common/time.h>
2022-07-31 09:09:12 +00:00
#include <common/sys/wait.h>
#include <driver/video/video.h>
#include <driver/usb/usb.h>
2022-07-18 08:07:34 +00:00
#include <exception/gate.h>
#include <filesystem/fat32/fat32.h>
#include <mm/slab.h>
#include <common/spinlock.h>
2022-07-18 08:07:34 +00:00
#include <syscall/syscall.h>
#include <syscall/syscall_num.h>
#include <sched/sched.h>
2022-08-01 03:34:06 +00:00
#include <common/unistd.h>
#include <debug/traceback/traceback.h>
2022-07-18 08:07:34 +00:00
2022-07-26 07:44:01 +00:00
#include <ktest/ktest.h>
2022-05-04 15:20:39 +00:00
// #pragma GCC push_options
// #pragma GCC optimize("O0")
2022-08-01 11:43:21 +00:00
2022-05-04 15:20:39 +00:00
spinlock_t process_global_pid_write_lock; // 增加pid的写锁
2022-05-06 03:44:53 +00:00
long process_global_pid = 1; // 系统中最大的pid
2022-04-13 09:58:06 +00:00
extern void system_call(void);
2022-04-26 05:12:59 +00:00
extern void kernel_thread_func(void);
2022-04-14 08:53:11 +00:00
ul _stack_start; // initial proc的栈基地址虚拟地址
2022-04-13 03:14:49 +00:00
struct mm_struct initial_mm = {0};
struct thread_struct initial_thread =
2022-04-14 08:53:11 +00:00
{
.rbp = (ul)(initial_proc_union.stack + STACK_SIZE / sizeof(ul)),
.rsp = (ul)(initial_proc_union.stack + STACK_SIZE / sizeof(ul)),
.fs = KERNEL_DS,
.gs = KERNEL_DS,
.cr2 = 0,
.trap_num = 0,
.err_code = 0};
2022-04-13 03:14:49 +00:00
// 初始化 初始进程的union ,并将其链接到.data.init_proc段内
union proc_union initial_proc_union __attribute__((__section__(".data.init_proc_union"))) = {INITIAL_PROC(initial_proc_union.pcb)};
struct process_control_block *initial_proc[MAX_CPU_NUM] = {&initial_proc_union.pcb, 0};
// 为每个核心初始化初始进程的tss
struct tss_struct initial_tss[MAX_CPU_NUM] = {[0 ... MAX_CPU_NUM - 1] = INITIAL_TSS};
/**
 * @brief Derive the new process's pcb flags from the clone flags
 *        (the definition in this file sets PF_VFORK when CLONE_VM is requested).
 *
 * @param clone_flags clone flags passed to do_fork
 * @param pcb pcb of the new process
 * @return uint64_t 0 on success
 */
uint64_t process_copy_flags(uint64_t clone_flags, struct process_control_block *pcb);
/**
 * @brief Set up the file descriptor table of the new process: left shared when
 *        CLONE_FS is set, otherwise every open entry of the current process is duplicated.
 *
 * @param clone_flags clone flags passed to do_fork
 * @param pcb pcb of the new process
 * @return uint64_t 0 on success
 */
uint64_t process_copy_files(uint64_t clone_flags, struct process_control_block *pcb);
/**
 * @brief Release the file structures held by a process (skipped for a PF_VFORK
 *        process) and clear its descriptor table.
 *
 * @param pcb pcb of the process whose files are released
 * @return uint64_t status; the callers in this file ignore it
 */
uint64_t process_exit_files(struct process_control_block *pcb);
/**
 * @brief Give the new process its address space: shared with the current process
 *        when CLONE_VM is set, otherwise a new page-table tree with copied user pages.
 *
 * @param clone_flags clone flags passed to do_fork
 * @param pcb pcb of the new process
 * @return uint64_t 0 on success
 */
uint64_t process_copy_mm(uint64_t clone_flags, struct process_control_block *pcb);
/**
 * @brief Free the user-space page tables, the mapped pages and the mm_struct of a process.
 *
 * @param pcb pcb of the process whose address space is released
 * @return uint64_t 0
 */
uint64_t process_exit_mm(struct process_control_block *pcb);
/**
 * @brief Build the thread structure and the initial register frame of the new
 *        process on its kernel stack.
 *
 * @param clone_flags clone flags passed to do_fork
 * @param pcb pcb of the new process
 * @param stack_start stack pointer value given to the child's register frame (non kernel-fork case)
 * @param stack_size stack size passed through from do_fork
 * @param current_regs register frame of the forking process
 * @return uint64_t 0 on success
 */
uint64_t process_copy_thread(uint64_t clone_flags, struct process_control_block *pcb, uint64_t stack_start, uint64_t stack_size, struct pt_regs *current_regs);
/**
 * @brief Release the thread structure of a process (the definition in this file is currently empty).
 *
 * @param pcb pcb of the exiting process
 */
void process_exit_thread(struct process_control_block *pcb);
/**
* @brief
*
* @param prev pcb
* @param next pcb
*
* fs和gs寄存器
*/
#pragma GCC push_options
#pragma GCC optimize("O0")
void __switch_to(struct process_control_block *prev, struct process_control_block *next)
{
2022-04-13 09:58:06 +00:00
initial_tss[proc_current_cpu_id].rsp0 = next->thread->rbp;
2022-04-26 05:12:59 +00:00
// kdebug("next_rsp = %#018lx ", next->thread->rsp);
// set_tss64((uint *)phys_2_virt(TSS64_Table), initial_tss[0].rsp0, initial_tss[0].rsp1, initial_tss[0].rsp2, initial_tss[0].ist1,
// initial_tss[0].ist2, initial_tss[0].ist3, initial_tss[0].ist4, initial_tss[0].ist5, initial_tss[0].ist6, initial_tss[0].ist7);
__asm__ __volatile__("movq %%fs, %0 \n\t"
: "=a"(prev->thread->fs));
__asm__ __volatile__("movq %%gs, %0 \n\t"
: "=a"(prev->thread->gs));
__asm__ __volatile__("movq %0, %%fs \n\t" ::"a"(next->thread->fs));
__asm__ __volatile__("movq %0, %%gs \n\t" ::"a"(next->thread->gs));
}
#pragma GCC pop_options
/**
 * @brief Open the executable at the given path for reading.
 *
 * The returned structure is allocated with kmalloc; the caller owns it and is
 * responsible for releasing it with kfree.
 *
 * @param path path of the executable
 * @return struct vfs_file_t* the opened file on success; on failure a negative
 *         errno value cast to a pointer (-ENOENT: path not found,
 *         -ENOTDIR: path names a directory, -ENOMEM: allocation failed)
 */
struct vfs_file_t *process_open_exec_file(char *path)
{
    struct vfs_dir_entry_t *dentry = vfs_path_walk(path, 0);
    if (dentry == NULL)
        return (void *)-ENOENT;

    // A directory cannot be executed
    if (dentry->dir_inode->attribute == VFS_ATTR_DIR)
        return (void *)-ENOTDIR;

    struct vfs_file_t *filp = (struct vfs_file_t *)kmalloc(sizeof(struct vfs_file_t), 0);
    if (filp == NULL)
        return (void *)-ENOMEM;

    // Zero the whole structure so that no field is left with stale heap contents
    memset(filp, 0, sizeof(struct vfs_file_t));

    filp->position = 0;
    filp->mode = ATTR_READ_ONLY;
    filp->dEntry = dentry;
    filp->file_ops = dentry->dir_inode->file_ops;

    return filp;
}
2022-05-18 10:27:00 +00:00
/**
* @brief elf格式的程序文件到内存中regs
*
* @param regs
* @param path
* @return int
*/
static int process_load_elf_file(struct pt_regs *regs, char *path)
{
int retval = 0;
struct vfs_file_t *filp = process_open_exec_file(path);
if ((long)filp <= 0 && (long)filp >= -255)
2022-05-18 10:27:00 +00:00
{
// kdebug("(long)filp=%ld", (long)filp);
2022-05-18 10:27:00 +00:00
return (unsigned long)filp;
}
void *buf = kmalloc(PAGE_4K_SIZE, 0);
memset(buf, 0, PAGE_4K_SIZE);
2022-05-18 10:27:00 +00:00
uint64_t pos = 0;
pos = filp->file_ops->lseek(filp, 0, SEEK_SET);
retval = filp->file_ops->read(filp, (char *)buf, sizeof(Elf64_Ehdr), &pos);
retval = 0;
if (!elf_check(buf))
{
kerror("Not an ELF file: %s", path);
retval = -ENOTSUP;
goto load_elf_failed;
}
#if ARCH(X86_64)
// 暂时只支持64位的文件
if (((Elf32_Ehdr *)buf)->e_ident[EI_CLASS] != ELFCLASS64)
{
kdebug("((Elf32_Ehdr *)buf)->e_ident[EI_CLASS]=%d", ((Elf32_Ehdr *)buf)->e_ident[EI_CLASS]);
retval = -EUNSUPPORTED;
goto load_elf_failed;
}
Elf64_Ehdr ehdr = *(Elf64_Ehdr *)buf;
// 暂时只支持AMD64架构
if (ehdr.e_machine != EM_AMD64)
{
kerror("e_machine=%d", ehdr.e_machine);
retval = -EUNSUPPORTED;
goto load_elf_failed;
}
#else
#error Unsupported architecture!
#endif
if (ehdr.e_type != ET_EXEC)
{
kerror("Not executable file! filename=%s\tehdr->e_type=%d", path, ehdr.e_type);
2022-05-18 10:27:00 +00:00
retval = -EUNSUPPORTED;
goto load_elf_failed;
}
2022-06-07 15:18:26 +00:00
// kdebug("filename=%s:\te_entry=%#018lx", path, ehdr.e_entry);
2022-05-18 10:27:00 +00:00
regs->rip = ehdr.e_entry;
current_pcb->mm->code_addr_start = ehdr.e_entry;
// kdebug("ehdr.e_phoff=%#018lx\t ehdr.e_phentsize=%d, ehdr.e_phnum=%d", ehdr.e_phoff, ehdr.e_phentsize, ehdr.e_phnum);
// 将指针移动到program header处
pos = ehdr.e_phoff;
// 读取所有的phdr
pos = filp->file_ops->lseek(filp, pos, SEEK_SET);
filp->file_ops->read(filp, (char *)buf, (uint64_t)ehdr.e_phentsize * (uint64_t)ehdr.e_phnum, &pos);
2022-05-18 10:27:00 +00:00
if ((unsigned long)filp <= 0)
{
kdebug("(unsigned long)filp=%d", (long)filp);
2022-05-31 13:55:06 +00:00
retval = -ENOEXEC;
goto load_elf_failed;
2022-05-18 10:27:00 +00:00
}
Elf64_Phdr *phdr = buf;
// 将程序加载到内存中
2022-05-18 10:27:00 +00:00
for (int i = 0; i < ehdr.e_phnum; ++i, ++phdr)
{
// kdebug("phdr[%d] phdr->p_offset=%#018lx phdr->p_vaddr=%#018lx phdr->p_memsz=%ld phdr->p_filesz=%ld phdr->p_type=%d", i, phdr->p_offset, phdr->p_vaddr, phdr->p_memsz, phdr->p_filesz, phdr->p_type);
// 不是可加载的段
if (phdr->p_type != PT_LOAD)
continue;
int64_t remain_mem_size = phdr->p_memsz;
int64_t remain_file_size = phdr->p_filesz;
pos = phdr->p_offset;
uint64_t virt_base = phdr->p_vaddr;
2022-06-07 15:18:26 +00:00
// kdebug("virt_base = %#018lx, &memory_management_struct=%#018lx", virt_base, &memory_management_struct);
2022-06-02 06:20:53 +00:00
2022-05-18 10:27:00 +00:00
while (remain_mem_size > 0)
{
// todo: 改用slab分配4K大小内存块并映射到4K页
if (!mm_check_mapped((uint64_t)current_pcb->mm->pgd, virt_base)) // 未映射,则新增物理页
{
2022-07-18 08:07:34 +00:00
mm_map_proc_page_table((uint64_t)current_pcb->mm->pgd, true, virt_base, alloc_pages(ZONE_NORMAL, 1, PAGE_PGT_MAPPED)->addr_phys, PAGE_2M_SIZE, PAGE_USER_PAGE, true, true, false);
2022-06-02 06:20:53 +00:00
2022-05-31 13:55:06 +00:00
memset((void *)virt_base, 0, PAGE_2M_SIZE);
2022-05-18 10:27:00 +00:00
}
pos = filp->file_ops->lseek(filp, pos, SEEK_SET);
int64_t val = 0;
if (remain_file_size != 0)
{
int64_t to_trans = (remain_file_size > PAGE_2M_SIZE) ? PAGE_2M_SIZE : remain_file_size;
val = filp->file_ops->read(filp, (char *)virt_base, to_trans, &pos);
2022-05-18 10:27:00 +00:00
}
if (val < 0)
goto load_elf_failed;
remain_mem_size -= PAGE_2M_SIZE;
remain_file_size -= val;
virt_base += PAGE_2M_SIZE;
}
}
// 分配2MB的栈内存空间
regs->rsp = current_pcb->mm->stack_start;
regs->rbp = current_pcb->mm->stack_start;
2022-06-02 06:20:53 +00:00
uint64_t pa = alloc_pages(ZONE_NORMAL, 1, PAGE_PGT_MAPPED)->addr_phys;
2022-06-07 15:18:26 +00:00
2022-07-18 08:07:34 +00:00
mm_map_proc_page_table((uint64_t)current_pcb->mm->pgd, true, current_pcb->mm->stack_start - PAGE_2M_SIZE, pa, PAGE_2M_SIZE, PAGE_USER_PAGE, true, true, false);
// 清空栈空间
2022-05-31 13:55:06 +00:00
memset((void *)(current_pcb->mm->stack_start - PAGE_2M_SIZE), 0, PAGE_2M_SIZE);
2022-05-18 10:27:00 +00:00
load_elf_failed:;
if (buf != NULL)
kfree(buf);
return retval;
}
/**
* @brief 使
*
* @param regs
* @param path
2022-05-31 13:55:06 +00:00
* @param argv
* @param envp
* @return ul
*/
#pragma GCC push_options
#pragma GCC optimize("O0")
2022-05-31 13:55:06 +00:00
ul do_execve(struct pt_regs *regs, char *path, char *argv[], char *envp[])
{
2022-05-06 03:44:53 +00:00
2022-06-07 15:18:26 +00:00
// kdebug("do_execve is running...");
// 当前进程正在与父进程共享地址空间,需要创建
// 独立的地址空间才能使新程序正常运行
if (current_pcb->flags & PF_VFORK)
{
kdebug("proc:%d creating new mem space", current_pcb->pid);
// 分配新的内存空间分布结构体
struct mm_struct *new_mms = (struct mm_struct *)kmalloc(sizeof(struct mm_struct), 0);
memset(new_mms, 0, sizeof(struct mm_struct));
current_pcb->mm = new_mms;
// 分配顶层页表, 并设置顶层页表的物理地址
new_mms->pgd = (pml4t_t *)virt_2_phys(kmalloc(PAGE_4K_SIZE, 0));
// 由于高2K部分为内核空间在接下来需要覆盖其数据因此不用清零
memset(phys_2_virt(new_mms->pgd), 0, PAGE_4K_SIZE / 2);
// 拷贝内核空间的页表指针
memcpy(phys_2_virt(new_mms->pgd) + 256, phys_2_virt(initial_proc[proc_current_cpu_id]) + 256, PAGE_4K_SIZE / 2);
}
2022-05-31 13:55:06 +00:00
// 设置用户栈和用户堆的基地址
2022-06-02 06:20:53 +00:00
unsigned long stack_start_addr = 0x6ffff0a00000UL;
const uint64_t brk_start_addr = 0x700000000000UL;
process_switch_mm(current_pcb);
// 为用户态程序设置地址边界
if (!(current_pcb->flags & PF_KTHREAD))
2022-04-26 16:39:02 +00:00
current_pcb->addr_limit = USER_MAX_LINEAR_ADDR;
current_pcb->mm->code_addr_end = 0;
current_pcb->mm->data_addr_start = 0;
current_pcb->mm->data_addr_end = 0;
current_pcb->mm->rodata_addr_start = 0;
current_pcb->mm->rodata_addr_end = 0;
current_pcb->mm->bss_start = 0;
current_pcb->mm->bss_end = 0;
2022-05-06 07:29:42 +00:00
current_pcb->mm->brk_start = brk_start_addr;
current_pcb->mm->brk_end = brk_start_addr;
current_pcb->mm->stack_start = stack_start_addr;
// 关闭之前的文件描述符
process_exit_files(current_pcb);
// 清除进程的vfork标志位
current_pcb->flags &= ~PF_VFORK;
2022-05-31 13:55:06 +00:00
// 加载elf格式的可执行文件
int tmp = process_load_elf_file(regs, path);
if (tmp < 0)
goto exec_failed;
2022-05-31 13:55:06 +00:00
// 拷贝参数列表
if (argv != NULL)
{
int argc = 0;
// 目标程序的argv基地址指针最大8个参数
char **dst_argv = (char **)(stack_start_addr - (sizeof(char **) << 3));
uint64_t str_addr = (uint64_t)dst_argv;
for (argc = 0; argc < 8 && argv[argc] != NULL; ++argc)
{
2022-06-07 15:18:26 +00:00
if (*argv[argc] == NULL)
break;
2022-05-31 13:55:06 +00:00
// 测量参数的长度最大1023
int argv_len = strnlen_user(argv[argc], 1023) + 1;
strncpy((char *)(str_addr - argv_len), argv[argc], argv_len - 1);
str_addr -= argv_len;
dst_argv[argc] = (char *)str_addr;
2022-08-01 03:34:06 +00:00
// 字符串加上结尾字符
2022-05-31 13:55:06 +00:00
((char *)str_addr)[argv_len] = '\0';
}
// 重新设定栈基址,并预留空间防止越界
stack_start_addr = str_addr - 8;
current_pcb->mm->stack_start = stack_start_addr;
regs->rsp = regs->rbp = stack_start_addr;
// 传递参数
regs->rdi = argc;
regs->rsi = (uint64_t)dst_argv;
}
2022-07-26 07:44:01 +00:00
// kdebug("execve ok");
2022-05-31 13:55:06 +00:00
regs->cs = USER_CS | 3;
regs->ds = USER_DS | 3;
regs->ss = USER_DS | 0x3;
regs->rflags = 0x200246;
regs->rax = 1;
regs->es = 0;
return 0;
exec_failed:;
process_do_exit(tmp);
}
#pragma GCC pop_options
/**
 * @brief Body of the first kernel thread, which turns itself into the init process.
 *
 * Initialises fat32 and usb, runs the kernel unit tests and waits for them,
 * then gives up its kernel-thread status, prepares a user-mode register frame
 * at the top of its kernel stack and jumps into do_execve to load /shell.elf.
 *
 * @param arg argument given at thread creation (unused)
 * @return ul 1 (only reached if the jump to do_execve returns here)
 */
#pragma GCC push_options
#pragma GCC optimize("O0")
ul initial_kernel_thread(ul arg)
{
    fat32_init();
    usb_init();

    // Run unit tests for some components
    uint64_t tpid[] = {
        ktest_start(ktest_test_bitree, 0),
        ktest_start(ktest_test_kfifo, 0),
        ktest_start(ktest_test_mutex, 0),
    };

    kinfo("Waiting test thread exit...");
    // Wait for the test threads to exit
    for (uint64_t i = 0; i < sizeof(tpid) / sizeof(uint64_t); ++i)
        waitpid(tpid[i], NULL, 0);
    kinfo("All test done.");

    // Prepare to switch to user mode
    struct pt_regs *regs;

    // An interrupt during the following code would return with wrong segment
    // selectors and raise #GP, so interrupts are disabled here.
    cli();

    current_pcb->thread->rip = (ul)ret_from_system_call;
    current_pcb->thread->rsp = (ul)current_pcb + STACK_SIZE - sizeof(struct pt_regs);
    current_pcb->thread->fs = USER_DS | 0x3;
    barrier();
    current_pcb->thread->gs = USER_DS | 0x3;

    // Voluntarily give up the kernel-thread identity
    current_pcb->flags &= (~PF_KTHREAD);
    kdebug("in initial_kernel_thread: flags=%ld", current_pcb->flags);

    regs = (struct pt_regs *)current_pcb->thread->rsp;
    current_pcb->flags = 0;

    // Switch to the prepared stack, push the address of the return-to-user code
    // as return address and jump to do_execve with
    // rdi = register frame, rsi = path of the user program, rdx = rcx = NULL.
    __asm__ __volatile__("movq %1, %%rsp \n\t"
                         "pushq %2 \n\t"
                         "jmp do_execve \n\t" ::"D"(current_pcb->thread->rsp),
                         "m"(current_pcb->thread->rsp), "m"(current_pcb->thread->rip), "S"("/shell.elf"), "c"(NULL), "d"(NULL)
                         : "memory");

    return 1;
}
#pragma GCC pop_options
2022-05-31 13:55:06 +00:00
/**
* @brief 退
*
*/
void process_exit_notify()
{
wait_queue_wakeup(&current_pcb->parent_pcb->wait_child_proc_exit, PROC_INTERRUPTIBLE);
}
/**
* @brief 退
*
* @param code
* @return ul
*/
2022-05-31 13:55:06 +00:00
ul process_do_exit(ul code)
{
// kinfo("process exiting..., code is %ld.", (long)code);
2022-05-31 13:55:06 +00:00
cli();
struct process_control_block *pcb = current_pcb;
// 进程退出时释放资源
process_exit_files(pcb);
process_exit_thread(pcb);
// todo: 可否在这里释放内存结构体?(在判断共享页引用问题之后)
pcb->state = PROC_ZOMBIE;
2022-06-02 06:20:53 +00:00
pcb->exit_code = code;
2022-05-31 13:55:06 +00:00
sti();
process_exit_notify();
sched_cfs();
while (1)
2022-08-01 03:34:06 +00:00
pause();
}
/**
* @brief
*
* @param fn
* @param arg
* @param flags
* @return int
*/
int kernel_thread(unsigned long (*fn)(unsigned long), unsigned long arg, unsigned long flags)
{
struct pt_regs regs;
barrier();
memset(&regs, 0, sizeof(regs));
barrier();
// 在rbx寄存器中保存进程的入口地址
regs.rbx = (ul)fn;
// 在rdx寄存器中保存传入的参数
regs.rdx = (ul)arg;
barrier();
regs.ds = KERNEL_DS;
barrier();
regs.es = KERNEL_DS;
barrier();
regs.cs = KERNEL_CS;
barrier();
regs.ss = KERNEL_DS;
barrier();
// 置位中断使能标志位
regs.rflags = (1 << 9);
barrier();
// rip寄存器指向内核线程的引导程序
regs.rip = (ul)kernel_thread_func;
barrier();
2022-04-26 05:12:59 +00:00
// kdebug("kernel_thread_func=%#018lx", kernel_thread_func);
// kdebug("&kernel_thread_func=%#018lx", &kernel_thread_func);
// kdebug("1111\tregs.rip = %#018lx", regs.rip);
2022-05-04 15:20:39 +00:00
return do_fork(&regs, flags | CLONE_VM, 0, 0);
}
/**
* @brief
*
*/
void process_init()
{
kinfo("Initializing process...");
initial_mm.pgd = (pml4t_t *)get_CR3();
initial_mm.code_addr_start = memory_management_struct.kernel_code_start;
initial_mm.code_addr_end = memory_management_struct.kernel_code_end;
initial_mm.data_addr_start = (ul)&_data;
initial_mm.data_addr_end = memory_management_struct.kernel_data_end;
initial_mm.rodata_addr_start = (ul)&_rodata;
initial_mm.rodata_addr_end = (ul)&_erodata;
2022-05-04 15:20:39 +00:00
initial_mm.bss_start = (uint64_t)&_bss;
initial_mm.bss_end = (uint64_t)&_ebss;
2022-05-06 07:29:42 +00:00
initial_mm.brk_start = memory_management_struct.start_brk;
initial_mm.brk_end = current_pcb->addr_limit;
2022-04-13 09:58:06 +00:00
initial_mm.stack_start = _stack_start;
2022-04-14 08:53:11 +00:00
2022-04-13 09:58:06 +00:00
initial_tss[proc_current_cpu_id].rsp0 = initial_thread.rbp;
2022-05-04 15:20:39 +00:00
// ========= 在IDLE进程的顶层页表中添加对内核地址空间的映射 =====================
// 由于IDLE进程的顶层页表的高地址部分会被后续进程所复制为了使所有进程能够共享相同的内核空间
// 因此需要先在IDLE进程的顶层页表内映射二级页表
uint64_t *idle_pml4t_vaddr = (uint64_t *)phys_2_virt((uint64_t)get_CR3() & (~0xfffUL));
for (int i = 256; i < 512; ++i)
{
uint64_t *tmp = idle_pml4t_vaddr + i;
barrier();
if (*tmp == 0)
2022-05-04 15:20:39 +00:00
{
void *pdpt = kmalloc(PAGE_4K_SIZE, 0);
barrier();
2022-05-04 15:20:39 +00:00
memset(pdpt, 0, PAGE_4K_SIZE);
barrier();
2022-05-04 15:20:39 +00:00
set_pml4t(tmp, mk_pml4t(virt_2_phys(pdpt), PAGE_KERNEL_PGT));
}
}
barrier();
flush_tlb();
/*
kdebug("initial_thread.rbp=%#018lx", initial_thread.rbp);
kdebug("initial_tss[0].rsp1=%#018lx", initial_tss[0].rsp1);
kdebug("initial_tss[0].ist1=%#018lx", initial_tss[0].ist1);
*/
2022-05-04 15:20:39 +00:00
// 初始化pid的写锁
2022-05-04 15:20:39 +00:00
spin_init(&process_global_pid_write_lock);
// 初始化进程的循环链表
list_init(&initial_proc_union.pcb.list);
barrier();
2022-07-26 07:44:01 +00:00
kernel_thread(initial_kernel_thread, 10, CLONE_FS | CLONE_SIGNAL); // 初始化内核线程
barrier();
initial_proc_union.pcb.state = PROC_RUNNING;
2022-04-13 03:14:49 +00:00
initial_proc_union.pcb.preempt_count = 0;
2022-05-04 15:20:39 +00:00
initial_proc_union.pcb.cpu_id = 0;
initial_proc_union.pcb.virtual_runtime = (1UL << 60);
current_pcb->virtual_runtime = (1UL << 60);
}
/**
* @brief fork当前进程
*
* @param regs
* @param clone_flags
* @param stack_start
* @param stack_size
* @return unsigned long
*/
unsigned long do_fork(struct pt_regs *regs, unsigned long clone_flags, unsigned long stack_start, unsigned long stack_size)
{
2022-05-04 15:20:39 +00:00
int retval = 0;
struct process_control_block *tsk = NULL;
2022-05-04 15:20:39 +00:00
// 为新的进程分配栈空间并将pcb放置在底部
tsk = (struct process_control_block *)kmalloc(STACK_SIZE, 0);
barrier();
2022-05-04 15:20:39 +00:00
if (tsk == NULL)
{
retval = -ENOMEM;
return retval;
}
barrier();
2022-05-04 15:20:39 +00:00
memset(tsk, 0, sizeof(struct process_control_block));
io_mfence();
// 将当前进程的pcb复制到新的pcb内
2022-05-04 15:20:39 +00:00
memcpy(tsk, current_pcb, sizeof(struct process_control_block));
io_mfence();
2022-04-14 08:53:11 +00:00
2022-08-01 03:34:06 +00:00
// 初始化进程的循环链表结点
list_init(&tsk->list);
io_mfence();
2022-08-01 03:34:06 +00:00
// 判断是否为内核态调用fork
if (current_pcb->flags & PF_KTHREAD && stack_start != 0)
tsk->flags |= PF_KFORK;
tsk->priority = 2;
2022-04-13 03:14:49 +00:00
tsk->preempt_count = 0;
2022-05-04 15:20:39 +00:00
// 增加全局的pid并赋值给新进程的pid
spin_lock(&process_global_pid_write_lock);
tsk->pid = process_global_pid++;
barrier();
2022-05-04 15:20:39 +00:00
// 加入到进程链表中
tsk->next_pcb = initial_proc_union.pcb.next_pcb;
barrier();
2022-05-04 15:20:39 +00:00
initial_proc_union.pcb.next_pcb = tsk;
barrier();
2022-05-04 15:20:39 +00:00
tsk->parent_pcb = current_pcb;
barrier();
2022-05-04 15:20:39 +00:00
spin_unlock(&process_global_pid_write_lock);
2022-04-13 09:58:06 +00:00
tsk->cpu_id = proc_current_cpu_id;
2022-06-09 16:22:14 +00:00
tsk->state = PROC_UNINTERRUPTIBLE;
2022-05-31 13:55:06 +00:00
tsk->parent_pcb = current_pcb;
wait_queue_init(&tsk->wait_child_proc_exit, NULL);
barrier();
2022-04-12 03:54:44 +00:00
list_init(&tsk->list);
2022-05-04 15:20:39 +00:00
retval = -ENOMEM;
// 拷贝标志位
if (process_copy_flags(clone_flags, tsk))
goto copy_flags_failed;
// 拷贝内存空间分布结构体
if (process_copy_mm(clone_flags, tsk))
goto copy_mm_failed;
// 拷贝文件
if (process_copy_files(clone_flags, tsk))
goto copy_files_failed;
// 拷贝线程结构体
if (process_copy_thread(clone_flags, tsk, stack_start, stack_size, regs))
goto copy_thread_failed;
// 拷贝成功
retval = tsk->pid;
2022-05-31 13:55:06 +00:00
2022-08-01 03:34:06 +00:00
tsk->flags &= ~PF_KFORK;
2022-05-04 15:20:39 +00:00
// 唤醒进程
process_wakeup(tsk);
return retval;
copy_thread_failed:;
// 回收线程
process_exit_thread(tsk);
copy_files_failed:;
// 回收文件
process_exit_files(tsk);
copy_mm_failed:;
// 回收内存空间分布结构体
process_exit_mm(tsk);
copy_flags_failed:;
kfree(tsk);
return retval;
return 0;
}
2022-05-04 15:20:39 +00:00
/**
 * @brief Look up the pcb of the process with the given pid.
 *
 * Walks the process list starting behind the initial process; the initial
 * process itself is never returned.
 *
 * @param pid pid to search for
 * @return struct process_control_block* the matching pcb, or NULL if none matches
 */
struct process_control_block *process_get_pcb(long pid)
{
    struct process_control_block *const head = &initial_proc_union.pcb;
    struct process_control_block *cur = head->next_pcb;

    // Plain linear search
    // todo: manage the pcbs with a hash table
    while (cur != head)
    {
        if (cur->pid == pid)
            return cur;
        cur = cur->next_pcb;
    }

    return NULL;
}
/**
* @brief
*
* @param pcb pcb
*/
void process_wakeup(struct process_control_block *pcb)
2022-07-12 04:01:51 +00:00
{
pcb->state = PROC_RUNNING;
sched_cfs_enqueue(pcb);
}
/**
* @brief
*
* @param pcb pcb
*/
void process_wakeup_immediately(struct process_control_block *pcb)
2022-05-04 15:20:39 +00:00
{
pcb->state = PROC_RUNNING;
sched_cfs_enqueue(pcb);
// 将当前进程标志为需要调度缩短新进程被wakeup的时间
current_pcb->flags |= PF_NEED_SCHED;
2022-05-04 15:20:39 +00:00
}
/**
 * @brief Derive the pcb flags of the new process from the clone flags.
 *
 * A process created with CLONE_VM is marked PF_VFORK.
 *
 * @param clone_flags clone flags
 * @param pcb pcb of the new process
 * @return uint64_t always 0
 */
uint64_t process_copy_flags(uint64_t clone_flags, struct process_control_block *pcb)
{
    const int shares_vm = (clone_flags & CLONE_VM) != 0;

    if (shares_vm)
        pcb->flags |= PF_VFORK;

    return 0;
}
/**
* @brief
*
* @param clone_flags
* @param pcb pcb
* @return uint64_t
*/
uint64_t process_copy_files(uint64_t clone_flags, struct process_control_block *pcb)
{
int retval = 0;
// 如果CLONE_FS被置位那么子进程与父进程共享文件描述符
// 文件描述符已经在复制pcb时被拷贝
if (clone_flags & CLONE_FS)
return retval;
// 为新进程拷贝新的文件描述符
for (int i = 0; i < PROC_MAX_FD_NUM; ++i)
{
if (current_pcb->fds[i] == NULL)
continue;
pcb->fds[i] = (struct vfs_file_t *)kmalloc(sizeof(struct vfs_file_t), 0);
memcpy(pcb->fds[i], current_pcb->fds[i], sizeof(struct vfs_file_t));
}
return retval;
}
/**
* @brief
*
* @param pcb pcb
* @return uint64_t
*/
uint64_t process_exit_files(struct process_control_block *pcb)
{
// 不与父进程共享文件描述符
if (!(pcb->flags & PF_VFORK))
2022-05-04 15:20:39 +00:00
{
for (int i = 0; i < PROC_MAX_FD_NUM; ++i)
{
if (pcb->fds[i] == NULL)
continue;
kfree(pcb->fds[i]);
}
2022-05-04 15:20:39 +00:00
}
// 清空当前进程的文件描述符列表
2022-05-04 15:20:39 +00:00
memset(pcb->fds, 0, sizeof(struct vfs_file_t *) * PROC_MAX_FD_NUM);
}
/**
* @brief
*
* @param clone_flags
* @param pcb pcb
* @return uint64_t
*/
uint64_t process_copy_mm(uint64_t clone_flags, struct process_control_block *pcb)
{
int retval = 0;
// 与父进程共享内存空间
if (clone_flags & CLONE_VM)
{
pcb->mm = current_pcb->mm;
2022-05-04 15:20:39 +00:00
return retval;
}
// 分配新的内存空间分布结构体
struct mm_struct *new_mms = (struct mm_struct *)kmalloc(sizeof(struct mm_struct), 0);
memset(new_mms, 0, sizeof(struct mm_struct));
memcpy(new_mms, current_pcb->mm, sizeof(struct mm_struct));
pcb->mm = new_mms;
// 分配顶层页表, 并设置顶层页表的物理地址
new_mms->pgd = (pml4t_t *)virt_2_phys(kmalloc(PAGE_4K_SIZE, 0));
// 由于高2K部分为内核空间在接下来需要覆盖其数据因此不用清零
memset(phys_2_virt(new_mms->pgd), 0, PAGE_4K_SIZE / 2);
2022-05-04 15:20:39 +00:00
// 拷贝内核空间的页表指针
2022-05-06 03:44:53 +00:00
memcpy(phys_2_virt(new_mms->pgd) + 256, phys_2_virt(initial_proc[proc_current_cpu_id]->mm->pgd) + 256, PAGE_4K_SIZE / 2);
2022-05-04 15:20:39 +00:00
2022-05-06 03:44:53 +00:00
uint64_t *current_pgd = (uint64_t *)phys_2_virt(current_pcb->mm->pgd);
2022-05-04 15:20:39 +00:00
2022-05-06 03:44:53 +00:00
uint64_t *new_pml4t = (uint64_t *)phys_2_virt(new_mms->pgd);
2022-05-04 15:20:39 +00:00
// 迭代地拷贝用户空间
for (int i = 0; i <= 255; ++i)
{
// 当前页表项为空
2022-05-06 03:44:53 +00:00
if ((*(uint64_t *)(current_pgd + i)) == 0)
2022-05-04 15:20:39 +00:00
continue;
2022-06-07 15:18:26 +00:00
2022-05-04 15:20:39 +00:00
// 分配新的二级页表
2022-06-02 06:20:53 +00:00
uint64_t *new_pdpt = (uint64_t *)kmalloc(PAGE_4K_SIZE, 0);
2022-05-04 15:20:39 +00:00
memset(new_pdpt, 0, PAGE_4K_SIZE);
2022-05-06 03:44:53 +00:00
2022-05-04 15:20:39 +00:00
// 在新的一级页表中设置新的二级页表表项
2022-05-06 03:44:53 +00:00
set_pml4t(new_pml4t + i, mk_pml4t(virt_2_phys(new_pdpt), (*(current_pgd + i)) & 0xfffUL));
2022-05-04 15:20:39 +00:00
2022-06-02 06:20:53 +00:00
uint64_t *current_pdpt = (uint64_t *)phys_2_virt((*(uint64_t *)(current_pgd + i)) & (~0xfffUL));
2022-06-07 15:18:26 +00:00
// kdebug("current_pdpt=%#018lx, current_pid=%d", current_pdpt, current_pcb->pid);
2022-05-04 15:20:39 +00:00
for (int j = 0; j < 512; ++j)
{
2022-06-02 06:20:53 +00:00
if (*(current_pdpt + j) == 0)
2022-05-04 15:20:39 +00:00
continue;
2022-05-06 03:44:53 +00:00
2022-05-04 15:20:39 +00:00
// 分配新的三级页表
2022-06-02 06:20:53 +00:00
uint64_t *new_pdt = (uint64_t *)kmalloc(PAGE_4K_SIZE, 0);
2022-05-04 15:20:39 +00:00
memset(new_pdt, 0, PAGE_4K_SIZE);
2022-06-02 06:20:53 +00:00
// 在二级页表中填写新的三级页表
2022-05-04 15:20:39 +00:00
// 在新的二级页表中设置三级页表的表项
2022-06-02 06:20:53 +00:00
set_pdpt((uint64_t *)(new_pdpt + j), mk_pdpt(virt_2_phys(new_pdt), (*(current_pdpt + j)) & 0xfffUL));
2022-05-04 15:20:39 +00:00
2022-06-02 06:20:53 +00:00
uint64_t *current_pdt = (uint64_t *)phys_2_virt((*(current_pdpt + j)) & (~0xfffUL));
2022-06-07 15:18:26 +00:00
// kdebug("current_pdt=%#018lx", current_pdt);
2022-06-02 06:20:53 +00:00
// 循环拷贝三级页表
2022-05-04 15:20:39 +00:00
for (int k = 0; k < 512; ++k)
{
2022-06-02 06:20:53 +00:00
if (*(current_pdt + k) == 0)
continue;
// 获取新的物理页
2022-06-02 06:20:53 +00:00
uint64_t pa = alloc_pages(ZONE_NORMAL, 1, PAGE_PGT_MAPPED)->addr_phys;
memset((void *)phys_2_virt(pa), 0, PAGE_2M_SIZE);
2022-06-02 06:20:53 +00:00
set_pdt((uint64_t *)(new_pdt + k), mk_pdt(pa, *(current_pdt + k) & 0x1ffUL));
2022-06-02 06:20:53 +00:00
// 拷贝数据
memcpy(phys_2_virt(pa), phys_2_virt((*(current_pdt + k)) & (~0x1ffUL)), PAGE_2M_SIZE);
2022-05-04 15:20:39 +00:00
}
}
}
return retval;
}
/**
* @brief
*
* @param pcb
* @return uint64_t
*/
uint64_t process_exit_mm(struct process_control_block *pcb)
{
if (pcb->flags & CLONE_VM)
return 0;
if (pcb->mm == NULL)
{
kdebug("pcb->mm==NULL");
return 0;
}
if (pcb->mm->pgd == NULL)
{
kdebug("pcb->mm->pgd==NULL");
return 0;
}
// 获取顶层页表
pml4t_t *current_pgd = (pml4t_t *)phys_2_virt(pcb->mm->pgd);
// 迭代地释放用户空间
for (int i = 0; i <= 255; ++i)
{
// 当前页表项为空
if ((current_pgd + i)->pml4t == 0)
continue;
// 二级页表entry
pdpt_t *current_pdpt = (pdpt_t *)phys_2_virt((current_pgd + i)->pml4t & (~0xfffUL));
// 遍历二级页表
for (int j = 0; j < 512; ++j)
{
if ((current_pdpt + j)->pdpt == 0)
continue;
// 三级页表的entry
pdt_t *current_pdt = (pdt_t *)phys_2_virt((current_pdpt + j)->pdpt & (~0xfffUL));
// 释放三级页表的内存页
for (int k = 0; k < 512; ++k)
{
if ((current_pdt + k)->pdt == 0)
continue;
2022-07-18 08:07:34 +00:00
// 存在4级页表
if (unlikely(((current_pdt + k)->pdt & (1 << 7)) == 0))
{
// 存在4K页
uint64_t *pt_ptr = (uint64_t *)phys_2_virt((current_pdt + k)->pdt & (~0x1fffUL));
uint64_t *pte_ptr = pt_ptr;
// 循环处理4K页表, 直接清空
// todo: 当支持使用slab分配4K内存作为进程的4K页之后在这里需要释放这些4K对象
for (int16_t g = 0; g < 512; ++g, ++pte_ptr)
*pte_ptr = 0;
// 4级页表已经空了释放页表
if (unlikely(mm_check_page_table(pt_ptr)) == 0)
kfree(pt_ptr);
}
else
{
// 释放内存页
if (mm_is_2M_page((current_pdt + k)->pdt & (~0x1fffUL))) // 校验是否为内存中的物理页
free_pages(Phy_to_2M_Page((current_pdt + k)->pdt & (~0x1fffUL)), 1);
}
2022-05-04 15:20:39 +00:00
}
// 释放三级页表
kfree(current_pdt);
}
// 释放二级页表
kfree(current_pdpt);
}
// 释放顶层页表
kfree(current_pgd);
// 释放内存空间分布结构体
kfree(pcb->mm);
return 0;
}
2022-08-01 03:34:06 +00:00
/**
 * @brief Relocate the saved frame pointers of a copied kernel stack.
 *
 * After the kernel stack of the current process has been copied into the stack
 * of new_pcb, the chain of saved rbp values still points into the old stack.
 * Starting at new_regs->rbp, each value is rewritten to the same offset below
 * the top of the new stack; new_regs->rsp is relocated the same way.
 *
 * @param new_regs register frame located in the new stack
 * @param new_pcb pcb of the new process
 * @return int always 0
 */
static int process_rewrite_rbp(struct pt_regs *new_regs, struct process_control_block *new_pcb)
{
    const uint64_t old_top = (uint64_t)(current_pcb) + STACK_SIZE;
    const uint64_t old_bottom = old_top - STACK_SIZE;
    const uint64_t new_top = ((uint64_t)new_pcb) + STACK_SIZE;
    const uint64_t new_bottom = new_top - STACK_SIZE;

    uint64_t *frame = &new_regs->rbp;

    // rbp does not point into the old kernel stack: nothing to relocate
    if ((uint64_t)*frame < old_bottom || (uint64_t)*frame >= old_top)
        return 0;

    for (;;)
    {
        // Same distance from the stack top, but measured in the new stack
        const uint64_t relocated = new_top - (old_top - *frame);

        // The relocated value leaves the new stack: end of the chain
        if (unlikely((uint64_t)relocated >= new_top || (uint64_t)relocated < new_bottom))
            break;

        // Store the relocated value and follow it to the next frame
        *frame = relocated;
        frame = (uint64_t *)relocated;
    }

    // rsp the kernel-mode fork sees when it returns into enter_syscall_int()
    new_regs->rsp = new_top - (old_top - new_regs->rsp);
    return 0;
}
2022-05-04 15:20:39 +00:00
/**
* @brief 线
*
* @param clone_flags
* @param pcb pcb
* @return uint64_t
*/
uint64_t process_copy_thread(uint64_t clone_flags, struct process_control_block *pcb, uint64_t stack_start, uint64_t stack_size, struct pt_regs *current_regs)
{
// 将线程结构体放置在pcb后方
struct thread_struct *thd = (struct thread_struct *)(pcb + 1);
memset(thd, 0, sizeof(struct thread_struct));
pcb->thread = thd;
2022-08-01 03:34:06 +00:00
struct pt_regs *child_regs = NULL;
2022-05-04 15:20:39 +00:00
// 拷贝栈空间
2022-08-01 03:34:06 +00:00
if (pcb->flags & PF_KFORK) // 内核态下的fork
{
// 内核态下则拷贝整个内核栈
uint32_t size = ((uint64_t)current_pcb) + STACK_SIZE - (uint64_t)(current_regs);
child_regs = (struct pt_regs *)(((uint64_t)pcb) + STACK_SIZE - size);
memcpy(child_regs, (void *)current_regs, size);
barrier();
2022-08-01 03:34:06 +00:00
// 然后重写新的栈中每个栈帧的rbp值
process_rewrite_rbp(child_regs, pcb);
}
else
{
child_regs = (struct pt_regs *)((uint64_t)pcb + STACK_SIZE - sizeof(struct pt_regs));
memcpy(child_regs, current_regs, sizeof(struct pt_regs));
barrier();
2022-08-01 03:34:06 +00:00
child_regs->rsp = stack_start;
}
2022-05-04 15:20:39 +00:00
// 设置子进程的返回值为0
2022-05-04 15:20:39 +00:00
child_regs->rax = 0;
2022-08-01 03:34:06 +00:00
if (pcb->flags & PF_KFORK)
thd->rbp = (uint64_t)(child_regs + 1); // 设置新的内核线程开始执行时的rbp也就是进入ret_from_system_call时的rbp
else
thd->rbp = (uint64_t)pcb + STACK_SIZE;
2022-05-04 15:20:39 +00:00
2022-08-01 03:34:06 +00:00
// 设置新的内核线程开始执行的时候的rsp
2022-05-04 15:20:39 +00:00
thd->rsp = (uint64_t)child_regs;
thd->fs = current_pcb->thread->fs;
thd->gs = current_pcb->thread->gs;
2022-08-01 03:34:06 +00:00
// 根据是否为内核线程、是否在内核态fork设置进程的开始执行的地址
if (pcb->flags & PF_KFORK)
thd->rip = (uint64_t)ret_from_system_call;
else if (pcb->flags & PF_KTHREAD && (!(pcb->flags & PF_KFORK)))
2022-05-04 15:20:39 +00:00
thd->rip = (uint64_t)kernel_thread_func;
else
thd->rip = (uint64_t)ret_from_system_call;
2022-08-01 03:34:06 +00:00
2022-05-04 15:20:39 +00:00
return 0;
}
/**
 * @brief Release the thread structure of a process.
 *
 * todo: not implemented yet, the function currently does nothing.
 *
 * @param pcb pcb of the exiting process
 */
void process_exit_thread(struct process_control_block *pcb)
{
}
// #pragma GCC pop_options