init/main.c

时间:2023-12-11 19:55:02

/*
* linux/init/main.c
*
* Copyright (C) 1991, 1992 Linus Torvalds
*/

#include <stdarg.h>

#include <asm/system.h>
#include <asm/io.h>

#include <linux/types.h>
#include <linux/fcntl.h>
#include <linux/config.h>
#include <linux/sched.h>
#include <linux/tty.h>
#include <linux/head.h>
#include <linux/unistd.h>
#include <linux/string.h>
#include <linux/timer.h>
#include <linux/fs.h>
#include <linux/ctype.h>
#include <linux/delay.h>
#include <linux/utsname.h>
#include <linux/ioport.h>

extern unsigned long * prof_buffer;
extern unsigned long prof_len;
extern char edata, end;
extern char *linux_banner;
//此函数在sys_call.s文件中
asmlinkage void lcall7(void);
struct desc_struct default_ldt;

/*
* we need this inline - forking from kernel space will result
* in NO COPY ON WRITE (!!!), until an execve is executed. This
* is no problem, but for the stack. This is handled by not letting
* main() use the stack at all after fork(). Thus, no function
* calls - which means inline code for fork too, as otherwise we
* would use the stack upon exit from 'fork()'.
*
* Actually only pause and fork are needed inline, so that there
* won't be any messing with the stack from main(), but we define
* some others too.
*/
#define __NR__exit __NR_exit
static inline _syscall0(int,idle)
static inline _syscall0(int,fork)
static inline _syscall0(int,pause)
static inline _syscall1(int,setup,void *,BIOS)
static inline _syscall0(int,sync)
static inline _syscall0(pid_t,setsid)
static inline _syscall3(int,write,int,fd,const char *,buf,off_t,count)
static inline _syscall1(int,dup,int,fd)
static inline _syscall3(int,execve,const char *,file,char **,argv,char **,envp)
static inline _syscall3(int,open,const char *,file,int,flag,int,mode)
static inline _syscall1(int,close,int,fd)
static inline _syscall1(int,_exit,int,exitcode)
static inline _syscall3(pid_t,waitpid,pid_t,pid,int *,wait_stat,int,options)

static inline pid_t wait(int * wait_stat)
{
return waitpid(-1,wait_stat,0);
}

static char printbuf[1024];

//控制台日志级别
extern int console_loglevel;

//零页
extern char empty_zero_page[PAGE_SIZE];
extern int vsprintf(char *,const char *,va_list);
extern void init(void);
extern void init_IRQ(void);
extern long kmalloc_init (long,long);
extern long blk_dev_init(long,long);
extern long chr_dev_init(long,long);
extern void floppy_init(void);
extern void sock_init(void);
extern long rd_init(long mem_start, int length);
unsigned long net_dev_init(unsigned long, unsigned long);
extern unsigned long simple_strtoul(const char *,char **,unsigned int);

extern void hd_setup(char *str, int *ints);
extern void bmouse_setup(char *str, int *ints);
extern void eth_setup(char *str, int *ints);
extern void xd_setup(char *str, int *ints);
extern void mcd_setup(char *str, int *ints);
extern void st0x_setup(char *str, int *ints);
extern void tmc8xx_setup(char *str, int *ints);
extern void t128_setup(char *str, int *ints);
extern void generic_NCR5380_setup(char *str, int *intr);
extern void aha152x_setup(char *str, int *ints);
extern void sound_setup(char *str, int *ints);
#ifdef CONFIG_SBPCD
extern void sbpcd_setup(char *str, int *ints);
#endif CONFIG_SBPCD

#ifdef CONFIG_SYSVIPC
extern void ipc_init(void);
#endif
#ifdef CONFIG_SCSI
extern unsigned long scsi_dev_init(unsigned long, unsigned long);
#endif

/*
* This is set up by the setup-routine at boot-time
*/
#define PARAM empty_zero_page
#define EXT_MEM_K (*(unsigned short *) (PARAM+2))
#define DRIVE_INFO (*(struct drive_info_struct *) (PARAM+0x80))
#define SCREEN_INFO (*(struct screen_info *) (PARAM+0))
#define MOUNT_ROOT_RDONLY (*(unsigned short *) (PARAM+0x1F2))
#define RAMDISK_SIZE (*(unsigned short *) (PARAM+0x1F8))
#define ORIG_ROOT_DEV (*(unsigned short *) (PARAM+0x1FC))
#define AUX_DEVICE_INFO (*(unsigned char *) (PARAM+0x1FF))

/*
* Boot command-line arguments
*/
#define MAX_INIT_ARGS 8
#define MAX_INIT_ENVS 8
#define COMMAND_LINE ((char *) (PARAM+2048))

extern void time_init(void);

static unsigned long memory_start = 0; /* After mem_init, stores the */
/* amount of free user memory */
static unsigned long memory_end = 0;
static unsigned long low_memory_start = 0;

static char term[21];
int rows, cols;

static char * argv_init[MAX_INIT_ARGS+2] = { "init", NULL, };
static char * envp_init[MAX_INIT_ENVS+2] = { "HOME=/", term, NULL, };

static char * argv_rc[] = { "/bin/sh", NULL };
static char * envp_rc[] = { "HOME=/", term, NULL };

static char * argv[] = { "-/bin/sh",NULL };
static char * envp[] = { "HOME=/usr/root", term, NULL };

struct drive_info_struct { char dummy[32]; } drive_info;
struct screen_info screen_info;

unsigned char aux_device_present;
int ramdisk_size;
int root_mountflags = 0;

static char fpu_error = 0;

static char command_line[80] = { 0, };

char *get_options(char *str, int *ints)
{
char *cur = str;
int i=1;

while (cur && isdigit(*cur) && i <= 10) {
ints[i++] = simple_strtoul(cur,NULL,0);
if ((cur = strchr(cur,',')) != NULL)
cur++;
}
ints[0] = i-1;
return(cur);
}

struct {
char *str;
void (*setup_func)(char *, int *);
} bootsetups[] = {
{ "reserve=", reserve_setup },
#ifdef CONFIG_INET
{ "ether=", eth_setup },
#endif
#ifdef CONFIG_BLK_DEV_HD
{ "hd=", hd_setup },
#endif
#ifdef CONFIG_BUSMOUSE
{ "bmouse=", bmouse_setup },
#endif
#ifdef CONFIG_SCSI_SEAGATE
{ "st0x=", st0x_setup },
{ "tmc8xx=", tmc8xx_setup },
#endif
#ifdef CONFIG_SCSI_T128
{ "t128=", t128_setup },
#endif
#ifdef CONFIG_SCSI_GENERIC_NCR5380
{ "ncr5380=", generic_NCR5380_setup },
#endif
#ifdef CONFIG_SCSI_AHA152X
{ "aha152x=", aha152x_setup},
#endif
#ifdef CONFIG_BLK_DEV_XD
{ "xd=", xd_setup },
#endif
#ifdef CONFIG_MCD
{ "mcd=", mcd_setup },
#endif
#ifdef CONFIG_SOUND
{ "sound=", sound_setup },
#endif
#ifdef CONFIG_SBPCD
{ "sbpcd=", sbpcd_setup },
#endif CONFIG_SBPCD
{ 0, 0 }
};

//检测设置,根据命令行中的命令,调整设置,实际上是设置各种设备的初始化函数
int checksetup(char *line)
{
int i = 0;
int ints[11];

//遍历数组
while (bootsetups[i].str) {
//所遍历到的项的字符串长度
int n = strlen(bootsetups[i].str);
//和给定的内容进行比较
if (!strncmp(line,bootsetups[i].str,n)) {
//如果相同,则调整挂接的设置函数
bootsetups[i].setup_func(get_options(line+n,ints), ints);
return(0);
}
i++;
}
return(1);
}

unsigned long loops_per_sec = 1;
//延迟校准
static void calibrate_delay(void)
{
int ticks;

printk("Calibrating delay loop.. ");
while (loops_per_sec <<= 1) {
ticks = jiffies;
__delay(loops_per_sec);
ticks = jiffies - ticks;
if (ticks >= HZ) {
__asm__("mull %1 ; divl %2"
:"=a" (loops_per_sec)
:"d" (HZ),
"r" (ticks),
"0" (loops_per_sec)
:"dx");
printk("ok - %lu.%02lu BogoMips\n",
loops_per_sec/500000,
(loops_per_sec/5000) % 100);
return;
}
}
printk("failed\n");
}

/*
* This is a simple kernel command line parsing function: it parses
* the command line, and fills in the arguments/environment to init
* as appropriate. Any cmd-line option is taken to be an environment
* variable if it contains the character '='.
*
*
* This routine also checks for options meant for the kernel - currently
* only the "root=XXXX" option is recognized. These options are not given
* to init - they are for internal kernel use only.
*/
//这是一个简单的内核命令行解析函数。它解析命令行参数,并且正确的填入init参数环境
static void parse_options(char *line)
{
char *next;
char *devnames[] = { "hda", "hdb", "sda", "sdb", "sdc", "sdd", "sde", "fd", "xda", "xdb", NULL };
int devnums[] = { 0x300, 0x340, 0x800, 0x810, 0x820, 0x830, 0x840, 0x200, 0xC00, 0xC40, 0};
int args, envs;

//校验参数
if (!*line)
return;
//
args = 0;
//终端默认设置为控制台模式
envs = 1; /* TERM is set to 'console' by default */
//next指向输入参数开始抵制
next = line;
//一直解析参数到结尾,分别确定根设备号、读写属性、日志级别,数学协处理器
while ((line = next) != NULL) {
//查找line字符串中的空格,将该位置置0
if ((next = strchr(line,' ')) != NULL)
*next++ = 0;
/*
* check for kernel options first..
*/
//检测内核选项

//首先检测是否有root
if (!strncmp(line,"root=",5)) {
//如果有root
int n;
line += 5;
//是否以"/dev/"开始
if (strncmp(line,"/dev/",5)) {
//如果不是,则直接将字符按16进制转换,作为根设备号
ROOT_DEV = simple_strtoul(line,NULL,16);
continue;
}
//跳过"/dev/"
line += 5;
//
for (n = 0 ; devnames[n] ; n++) {
//设备名称的长度
int len = strlen(devnames[n]);
//查找设备名称
if (!strncmp(line,devnames[n],len)) {
//确定根设备号
ROOT_DEV = devnums[n]+simple_strtoul(line+len,NULL,16);
break;
}
}
} else if (!strcmp(line,"ro")) //如果不是root,则比较是否为ro,即只读
root_mountflags |= MS_RDONLY;
else if (!strcmp(line,"rw")) //是否为rw,即读写
root_mountflags &= ~MS_RDONLY;
else if (!strcmp(line,"debug")) //日志级别
console_loglevel = 10;
else if (!strcmp(line,"no387")) { //是否定义了协处理器
hard_math = 0;
__asm__("movl %%cr0,%%eax\n\t"
"orl $0xE,%%eax\n\t"
"movl %%eax,%%cr0\n\t" : : : "ax");
} else
checksetup(line); //检测设置,重新设置函数
/*
* Then check if it's an environment variable or
* an option.
*/
//检测其它设置
if (strchr(line,'=')) {
if (envs >= MAX_INIT_ENVS)
break;
envp_init[++envs] = line;
} else {
if (args >= MAX_INIT_ARGS)
break;
argv_init[++args] = line;
}
}
argv_init[args+1] = NULL;
envp_init[envs+1] = NULL;
}

//如果在命令行中定义了内存的大小的处理方法,将from内容拷贝到to中,不包含内存的大小
static void copy_options(char * to, char * from)
{
//初始化字符变量未空格
char c = ' ';

//循环处理字符串from,搜索mem=字符串,找到定义值
do {
if (c == ' ' && !memcmp("mem=", from, 4))
memory_end = simple_strtoul(from+4, &from, 0);
c = *(to++) = *(from++);
} while (c);
}

//超时处理
static void copro_timeout(void)
{
fpu_error = 1;
timer_table[COPRO_TIMER].expires = jiffies+100;
timer_active |= 1<<COPRO_TIMER;
printk("387 failed: trying to reset\n");
send_sig(SIGFPE, last_task_used_math, 1);
outb_p(0,0xf1);
outb_p(0,0xf0);
}

//入口函数
asmlinkage void start_kernel(void)
{
/*
* Interrupts are still disabled. Do necessary setups, then
* enable them
*/
//挂接lcall7到默认的ldt中
set_call_gate(&default_ldt,lcall7);
//初始的根设备
ROOT_DEV = ORIG_ROOT_DEV;
//驱动器信息
drive_info = DRIVE_INFO;
//屏幕信息
screen_info = SCREEN_INFO;
//辅助设备信息
aux_device_present = AUX_DEVICE_INFO;
//内存结束位置 1M位置 + 扩展内存(k)*1024
memory_end = (1<<20) + (EXT_MEM_K<<10);
//忽略不到4kb大小的内存
memory_end &= PAGE_MASK;
//ramdisk的长度
ramdisk_size = RAMDISK_SIZE;
//拷贝命令行选项,实际上就是看命令行中是否指定内存大小
// 输入参数command_line目前只有空间,COMMAND_LINE为启动参数
copy_options(command_line,COMMAND_LINE);
//内存定义超过16M的处理
#ifdef CONFIG_MAX_16M
if (memory_end > 16*1024*1024)
memory_end = 16*1024*1024;
#endif
//挂接只读根设备的标志
if (MOUNT_ROOT_RDONLY)
root_mountflags |= MS_RDONLY;
//如果内核所占内存超过1M
if ((unsigned long)&end >= (1024*1024)) {
//重新按照实际情况设置核心内存的开始位置
memory_start = (unsigned long) &end;
low_memory_start = PAGE_SIZE;
} else {
//否者设置主存开始处为1M内存处
memory_start = 1024*1024;
low_memory_start = (unsigned long) &end;
}
//这里如此设置,是因为没有超过的话,在1m内存之前还有剩余

//内存低地址开始处对齐
low_memory_start = PAGE_ALIGN(low_memory_start);
//初始内存页
memory_start = paging_init(memory_start,memory_end);

//判断是否为EISA总线
if (strncmp((char*)0x0FFFD9, "EISA", 4) == 0)
EISA_bus = 1;
//初始化陷阱门
trap_init();
//初始化IRQ
init_IRQ();
//任务调度初始化
sched_init();
//解析命令行
parse_options(command_line);
//配置CONFIG_PROFILE的情况下,内存布局
#ifdef CONFIG_PROFILE
prof_buffer = (unsigned long *) memory_start;
prof_len = (unsigned long) &end;
prof_len >>= 2;
memory_start += prof_len * sizeof(unsigned long);
#endif
//初始化lmalloc
memory_start = kmalloc_init(memory_start,memory_end);
//初始化字符设备
memory_start = chr_dev_init(memory_start,memory_end);
//初始化块设备
memory_start = blk_dev_init(memory_start,memory_end);
//开中断
sti();
//延迟
calibrate_delay();
//初始化网络设备
#ifdef CONFIG_INET
memory_start = net_dev_init(memory_start,memory_end);
#endif
//初始化scsi设备
#ifdef CONFIG_SCSI
memory_start = scsi_dev_init(memory_start,memory_end);
#endif
//初始化inode
memory_start = inode_init(memory_start,memory_end);
//初始化文件表
memory_start = file_table_init(memory_start,memory_end);
//内存初始化
mem_init(low_memory_start,memory_start,memory_end);
//高速缓冲区初始化
buffer_init();
//初始化时间
time_init();
//初始化软盘
floppy_init();
//初始化sock
sock_init();
//初始化ipc
#ifdef CONFIG_SYSVIPC
ipc_init();
#endif
sti();

/*
* check if exception 16 works correctly.. This is truly evil
* code: it disables the high 8 interrupts to make sure that
* the irq13 doesn't happen. But as this will lead to a lockup
* if no exception16 arrives, it depends on the fact that the
* high 8 interrupts will be re-enabled by the next timer tick.
* So the irq13 will happen eventually, but the exception 16
* should get there first..
*/
//数学协处理器处理
if (hard_math) {
unsigned short control_word;

printk("Checking 386/387 coupling... ");
timer_table[COPRO_TIMER].expires = jiffies+50;
timer_table[COPRO_TIMER].fn = copro_timeout;
timer_active |= 1<<COPRO_TIMER;
__asm__("clts ; fninit ; fnstcw %0 ; fwait":"=m" (*&control_word));
control_word &= 0xffc0;
__asm__("fldcw %0 ; fwait": :"m" (*&control_word));
outb_p(inb_p(0x21) | (1 << 2), 0x21);
__asm__("fldz ; fld1 ; fdiv %st,%st(1) ; fwait");
timer_active &= ~(1<<COPRO_TIMER);
if (!fpu_error)
printk("Ok, fpu using %s error reporting.\n",
ignore_irq13?"exception 16":"irq13");
}
#ifndef CONFIG_MATH_EMULATION
else {
printk("No coprocessor found and no math emulation present.\n");
printk("Giving up.\n");
for (;;) ;
}
#endif

//
system_utsname.machine[1] = '0' + x86;
printk(linux_banner);

//转到用户空间
move_to_user_mode();
//创建新进程
if (!fork()) /* we count on this going ok */
//init进程
init();
/*
* task[0] is meant to be used as an "idle" task: it may not sleep, but
* it might do some general things like count free pages or it could be
* used to implement a reasonable LRU algorithm for the paging routines:
* anything that can be useful, but shouldn't take time from the real
* processes.
*
* Right now task[0] just does a infinite idle loop.
*/
for(;;)
idle();
}

//打印函数
static int printf(const char *fmt, ...)
{
va_list args;
int i;

va_start(args, fmt);
write(1,printbuf,i=vsprintf(printbuf, fmt, args));
va_end(args);
return i;
}

//init进程
void init(void)
{
int pid,i;

setup((void *) &drive_info);
sprintf(term, "TERM=con%dx%d", ORIG_VIDEO_COLS, ORIG_VIDEO_LINES);
(void) open("/dev/tty1",O_RDWR,0);
(void) dup(0);
(void) dup(0);

execve("/etc/init",argv_init,envp_init);
execve("/bin/init",argv_init,envp_init);
execve("/sbin/init",argv_init,envp_init);
/* if this fails, fall through to original stuff */

if (!(pid=fork())) {
close(0);
if (open("/etc/rc",O_RDONLY,0))
_exit(1);
execve("/bin/sh",argv_rc,envp_rc);
_exit(2);
}
if (pid>0)
while (pid != wait(&i))
/* nothing */;
while (1) {
if ((pid = fork()) < 0) {
printf("Fork failed in init\n\r");
continue;
}
if (!pid) {
close(0);close(1);close(2);
setsid();
(void) open("/dev/tty1",O_RDWR,0);
(void) dup(0);
(void) dup(0);
_exit(execve("/bin/sh",argv,envp));
}
while (1)
if (pid == wait(&i))
break;
printf("\n\rchild %d died with code %04x\n\r",pid,i);
sync();
}
_exit(0);
}