内核源码:linux-2.6.38.8.tar.bz2
目标平台:ARM体系结构
在Linux系统中,进程和线程都使用task_struct结构体来表示,线程只不过是一种特殊(所谓的特殊也不过是在被创建时使用不同的clone标志组合而已)的进程罢了。
内核线程只运行在内核态,只能使用大于PAGE_OFFSET的线性地址空间。
1、进程0
在Linux系统中,只有这个进程是静态分配的。
/* linux-2.6.38.8/arch/arm/kernel/init_task.c */
struct task_struct init_task = INIT_TASK(init_task);
union thread_union init_thread_union __init_task_data =
{ INIT_THREAD_INFO(init_task) };
然后,通过INIT_TASK宏初始化init_task结构体,通过INIT_THREAD_INFO宏初始化thread_info结构体。
/* linux-2.6.38.8/include/linux/init_task.h */
#define INIT_TASK(tsk) \
{ \
.state = 0, \
.stack = &init_thread_info, \
.usage = ATOMIC_INIT(2), \
.flags = PF_KTHREAD, \
.lock_depth = -1, \
.prio = MAX_PRIO-20, \
.static_prio = MAX_PRIO-20, \
.normal_prio = MAX_PRIO-20, \
.policy = SCHED_NORMAL, \
.cpus_allowed = CPU_MASK_ALL, \
.mm = NULL, \
.active_mm = &init_mm, \
.se = { \
.group_node = LIST_HEAD_INIT(tsk.se.group_node), \
}, \
.rt = { \
.run_list = LIST_HEAD_INIT(tsk.rt.run_list), \
.time_slice = HZ, \
.nr_cpus_allowed = NR_CPUS, \
}, \
.tasks = LIST_HEAD_INIT(tsk.tasks), \
INIT_PUSHABLE_TASKS(tsk) \
.ptraced = LIST_HEAD_INIT(tsk.ptraced), \
.ptrace_entry = LIST_HEAD_INIT(tsk.ptrace_entry), \
.real_parent = &tsk, \
.parent = &tsk, \
.children = LIST_HEAD_INIT(tsk.children), \
.sibling = LIST_HEAD_INIT(tsk.sibling), \
.group_leader = &tsk, \
RCU_INIT_POINTER(.real_cred, &init_cred), \
RCU_INIT_POINTER(.cred, &init_cred), \
.comm = "swapper", \
.thread = INIT_THREAD, \
.fs = &init_fs, \
.files = &init_files, \
.signal = &init_signals, \
.sighand = &init_sighand, \
.nsproxy = &init_nsproxy, \
.pending = { \
.list = LIST_HEAD_INIT(tsk.pending.list), \
.signal = {{0}}}, \
.blocked = {{0}}, \
.alloc_lock = __SPIN_LOCK_UNLOCKED(tsk.alloc_lock), \
.journal_info = NULL, \
.cpu_timers = INIT_CPU_TIMERS(tsk.cpu_timers), \
.fs_excl = ATOMIC_INIT(0), \
.pi_lock = __RAW_SPIN_LOCK_UNLOCKED(tsk.pi_lock), \
.timer_slack_ns = 50000, /* 50 usec default slack */ \
.pids = { \
[PIDTYPE_PID] = INIT_PID_LINK(PIDTYPE_PID), \
[PIDTYPE_PGID] = INIT_PID_LINK(PIDTYPE_PGID), \
[PIDTYPE_SID] = INIT_PID_LINK(PIDTYPE_SID), \
}, \
.thread_group = LIST_HEAD_INIT(tsk.thread_group), \
.dirties = INIT_PROP_LOCAL_SINGLE(dirties), \
INIT_IDS \
INIT_PERF_EVENTS(tsk) \
INIT_TRACE_IRQFLAGS \
INIT_LOCKDEP \
INIT_FTRACE_GRAPH \
INIT_TRACE_RECURSION \
INIT_TASK_RCU_PREEMPT(tsk) \
}
/* linux-2.6.38.8/arch/arm/include/asm/thread_info.h */
#define INIT_THREAD_INFO(tsk) \
{ \
.task = &tsk, \
.exec_domain = &default_exec_domain, \
.flags = 0, \
.preempt_count = INIT_PREEMPT_COUNT, \
.addr_limit = KERNEL_DS, \
.cpu_domain = domain_val(DOMAIN_USER, DOMAIN_MANAGER) | \
domain_val(DOMAIN_KERNEL, DOMAIN_MANAGER) | \
domain_val(DOMAIN_IO, DOMAIN_CLIENT), \
.restart_block = { \
.fn = do_no_restart_syscall, \
}, \
}
2、进程1和kthreadd内核线程
/* linux-2.6.38.8/init/main.c */
kernel_thread(kernel_init, NULL, CLONE_FS | CLONE_SIGHAND);
pid = kernel_thread(kthreadd, NULL, CLONE_FS | CLONE_FILES);
kthreadd_task = find_task_by_pid_ns(pid, &init_pid_ns);
/* linux-2.6.38.8/arch/arm/kernel/process.c */
pid_t kernel_thread(int (*fn)(void *), void *arg, unsigned long flags)
{
struct pt_regs regs;
memset(®s, 0, sizeof(regs));
regs.ARM_r4 = (unsigned long)arg;
regs.ARM_r5 = (unsigned long)fn;
regs.ARM_r6 = (unsigned long)kernel_thread_exit;
regs.ARM_r7 = SVC_MODE | PSR_ENDSTATE | PSR_ISETSTATE;
regs.ARM_pc = (unsigned long)kernel_thread_helper;
regs.ARM_cpsr = regs.ARM_r7 | PSR_I_BIT;
return do_fork(flags|CLONE_VM|CLONE_UNTRACED, 0, ®s, 0, NULL, NULL);
}
当创建的进程被调度时,就会执行fn所指向的函数,参数arg用来给fn所指向的函数传递参数。参数flags用来保存传递给do_fork函数的clone标志。
内核线程kthreadd用来创建其它的内核线程。在Ubuntu 11.04中,所有其它的内核线程的父进程都是此线程。
$ ps -ef | grep "00 \[.*\]$" //在这里,内核线程都用中括号括起来以示区别
root 2 0 0 12:48 ? 00:00:00 [kthreadd]
root 3 2 0 12:48 ? 00:00:00 [ksoftirqd/0]
root 4 2 0 12:48 ? 00:00:00 [kworker/0:0]
root 6 2 0 12:48 ? 00:00:00 [migration/0]
root 7 2 0 12:48 ? 00:00:00 [cpuset]
root 8 2 0 12:48 ? 00:00:00 [khelper]
root 9 2 0 12:48 ? 00:00:00 [netns]
root 10 2 0 12:48 ? 00:00:00 [sync_supers]
root 11 2 0 12:48 ? 00:00:00 [bdi-default]
root 12 2 0 12:48 ? 00:00:00 [kintegrityd]
root 13 2 0 12:48 ? 00:00:00 [kblockd]
root 14 2 0 12:48 ? 00:00:00 [kacpid]
root 15 2 0 12:48 ? 00:00:00 [kacpi_notify]
root 16 2 0 12:48 ? 00:00:00 [kacpi_hotplug]
root 17 2 0 12:48 ? 00:00:00 [ata_sff]
root 18 2 0 12:48 ? 00:00:00 [khubd]
root 19 2 0 12:48 ? 00:00:00 [md]
root 22 2 0 12:48 ? 00:00:00 [khungtaskd]
root 23 2 0 12:48 ? 00:00:00 [kswapd0]
root 24 2 0 12:48 ? 00:00:00 [ksmd]
root 25 2 0 12:48 ? 00:00:00 [fsnotify_mark]
root 26 2 0 12:48 ? 00:00:00 [aio]
root 27 2 0 12:48 ? 00:00:00 [ecryptfs-kthrea]
root 28 2 0 12:48 ? 00:00:00 [crypto]
root 32 2 0 12:48 ? 00:00:00 [kthrotld]
root 34 2 0 12:48 ? 00:00:00 [scsi_eh_0]
root 35 2 0 12:48 ? 00:00:00 [scsi_eh_1]
root 36 2 0 12:48 ? 00:00:00 [kworker/u:3]
root 38 2 0 12:48 ? 00:00:00 [kworker/0:2]
root 39 2 0 12:48 ? 00:00:00 [kmpathd]
root 40 2 0 12:48 ? 00:00:00 [kmpath_handlerd]
root 41 2 0 12:48 ? 00:00:00 [kondemand]
root 42 2 0 12:48 ? 00:00:00 [kconservative]
root 192 2 0 12:48 ? 00:00:00 [mpt_poll_0]
root 193 2 0 12:48 ? 00:00:00 [mpt/0]
root 194 2 0 12:48 ? 00:00:00 [scsi_eh_2]
root 210 2 0 12:48 ? 00:00:00 [kjournald]
root 448 2 0 12:50 ? 00:00:00 [kpsmoused]
root 486 2 0 12:50 ? 00:00:00 [vmmemctl]
root 642 2 0 12:50 ? 00:00:00 [rpciod]
root 659 2 0 12:50 ? 00:00:00 [nfsiod]
root 703 2 0 12:50 ? 00:00:00 [flush-8:0]
root 876 2 0 12:50 ? 00:00:00 [lockd]
root 877 2 0 12:50 ? 00:00:00 [nfsd4]
root 878 2 0 12:50 ? 00:00:00 [nfsd4_callbacks]
root 879 2 0 12:50 ? 00:00:00 [nfsd]
root 880 2 0 12:50 ? 00:00:00 [nfsd]
root 881 2 0 12:50 ? 00:00:00 [nfsd]
root 882 2 0 12:50 ? 00:00:00 [nfsd]
root 883 2 0 12:50 ? 00:00:00 [nfsd]
root 884 2 0 12:50 ? 00:00:00 [nfsd]
root 885 2 0 12:50 ? 00:00:00 [nfsd]
root 886 2 0 12:50 ? 00:00:00 [nfsd]
其中用来创建其它内核线程的函数如下:
/* linux-2.6.38.8/kernel/kthread.c */
int kthreadd(void *unused)
{
struct task_struct *tsk = current;
/* Setup a clean context for our children to inherit. */
set_task_comm(tsk, "kthreadd");
ignore_signals(tsk);
set_cpus_allowed_ptr(tsk, cpu_all_mask);
set_mems_allowed(node_states[N_HIGH_MEMORY]);
current->flags |= PF_NOFREEZE | PF_FREEZER_NOSIG;
for (;;) {
set_current_state(TASK_INTERRUPTIBLE);
if (list_empty(&kthread_create_list))
schedule();
__set_current_state(TASK_RUNNING);
spin_lock(&kthread_create_lock);
while (!list_empty(&kthread_create_list)) {
struct kthread_create_info *create;
create = list_entry(kthread_create_list.next,
struct kthread_create_info, list);
list_del_init(&create->list);
spin_unlock(&kthread_create_lock);
create_kthread(create);
spin_lock(&kthread_create_lock);
}
spin_unlock(&kthread_create_lock);
}
return 0;
}
kthreadd函数通过死循环不断地检查kthread_create_list链表是否为空,如果不为空,则调用create_kthread函数来创建新的内核线程。
/* linux-2.6.38.8/kernel/kthread.c */
static void create_kthread(struct kthread_create_info *create)
{
int pid;
/* We want our own signal handler (we take no signals by default). */
pid = kernel_thread(kthread, create, CLONE_FS | CLONE_FILES | SIGCHLD);
if (pid < 0) {
create->result = ERR_PTR(pid);
complete(&create->done);
}
}
在Linux内核中,可通过调用kthread_create函数来发起内核线程的创建。
/* linux-2.6.38.8/kernel/kthread.c */
struct task_struct *kthread_create(int (*threadfn)(void *data),
void *data,
const char namefmt[],
...)
{
struct kthread_create_info create;
create.threadfn = threadfn;
create.data = data;
init_completion(&create.done);
spin_lock(&kthread_create_lock);
list_add_tail(&create.list, &kthread_create_list);
spin_unlock(&kthread_create_lock);
wake_up_process(kthreadd_task); //唤醒kthreadd来创建内核线程
wait_for_completion(&create.done); //等待内核线程创建完毕
if (!IS_ERR(create.result)) {
static const struct sched_param param = { .sched_priority = 0 };
va_list args;
va_start(args, namefmt);
vsnprintf(create.result->comm, sizeof(create.result->comm),
namefmt, args);
va_end(args);
/*
* root may have changed our (kthreadd's) priority or CPU mask.
* The kernel thread should not inherit these properties.
*/
sched_setscheduler_nocheck(create.result, SCHED_NORMAL, ¶m);
set_cpus_allowed_ptr(create.result, cpu_all_mask);
}
return create.result;
}