main.c 22.2 KB
Newer Older
Linus Torvalds's avatar
Linus Torvalds committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
/*
 *  linux/init/main.c
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 *
 *  GK 2/5/95  -  Changed to support mounting root fs via NFS
 *  Added initrd & change_root: Werner Almesberger & Hans Lermen, Feb '96
 *  Moan early if gcc is old, avoiding bogus kernels - Paul Gortmaker, May '96
 *  Simplified starting of init:  Michael A. Griffith <grif@acm.org> 
 */

#include <linux/types.h>
#include <linux/module.h>
#include <linux/proc_fs.h>
#include <linux/kernel.h>
#include <linux/syscalls.h>
Ingo Molnar's avatar
Ingo Molnar committed
17
#include <linux/stackprotector.h>
Linus Torvalds's avatar
Linus Torvalds committed
18
19
20
21
22
23
24
25
26
27
28
29
30
#include <linux/string.h>
#include <linux/ctype.h>
#include <linux/delay.h>
#include <linux/utsname.h>
#include <linux/ioport.h>
#include <linux/init.h>
#include <linux/smp_lock.h>
#include <linux/initrd.h>
#include <linux/bootmem.h>
#include <linux/tty.h>
#include <linux/gfp.h>
#include <linux/percpu.h>
#include <linux/kmod.h>
Nick Piggin's avatar
Nick Piggin committed
31
#include <linux/vmalloc.h>
Linus Torvalds's avatar
Linus Torvalds committed
32
#include <linux/kernel_stat.h>
33
#include <linux/start_kernel.h>
Linus Torvalds's avatar
Linus Torvalds committed
34
#include <linux/security.h>
35
#include <linux/smp.h>
Linus Torvalds's avatar
Linus Torvalds committed
36
37
38
39
40
41
42
43
#include <linux/workqueue.h>
#include <linux/profile.h>
#include <linux/rcupdate.h>
#include <linux/moduleparam.h>
#include <linux/kallsyms.h>
#include <linux/writeback.h>
#include <linux/cpu.h>
#include <linux/cpuset.h>
44
#include <linux/cgroup.h>
Linus Torvalds's avatar
Linus Torvalds committed
45
#include <linux/efi.h>
46
#include <linux/tick.h>
47
#include <linux/interrupt.h>
48
#include <linux/taskstats_kern.h>
49
#include <linux/delayacct.h>
Linus Torvalds's avatar
Linus Torvalds committed
50
51
52
53
#include <linux/unistd.h>
#include <linux/rmap.h>
#include <linux/mempolicy.h>
#include <linux/key.h>
Adrian Bunk's avatar
Adrian Bunk committed
54
#include <linux/buffer_head.h>
55
#include <linux/page_cgroup.h>
56
#include <linux/debug_locks.h>
57
#include <linux/debugobjects.h>
Ingo Molnar's avatar
Ingo Molnar committed
58
#include <linux/lockdep.h>
59
#include <linux/kmemleak.h>
60
#include <linux/pid_namespace.h>
61
#include <linux/device.h>
62
#include <linux/kthread.h>
63
#include <linux/sched.h>
64
#include <linux/signal.h>
65
#include <linux/idr.h>
66
#include <linux/ftrace.h>
67
#include <linux/async.h>
68
#include <linux/kmemcheck.h>
69
#include <linux/kmemtrace.h>
70
#include <trace/boot.h>
Linus Torvalds's avatar
Linus Torvalds committed
71
72
73
74

#include <asm/io.h>
#include <asm/bugs.h>
#include <asm/setup.h>
75
#include <asm/sections.h>
76
#include <asm/cacheflush.h>
Linus Torvalds's avatar
Linus Torvalds committed
77
78
79
80
81

#ifdef CONFIG_X86_LOCAL_APIC
#include <asm/smp.h>
#endif

82
static int kernel_init(void *);
Linus Torvalds's avatar
Linus Torvalds committed
83
84
85
86
87
88
89
90
91
92
93
94
95

extern void init_IRQ(void);
extern void fork_init(unsigned long);
extern void mca_init(void);
extern void sbus_init(void);
extern void prio_tree_init(void);
extern void radix_tree_init(void);
extern void free_initmem(void);
#ifdef	CONFIG_ACPI
extern void acpi_early_init(void);
#else
static inline void acpi_early_init(void) { }
#endif
96
97
98
#ifndef CONFIG_DEBUG_RODATA
static inline void mark_rodata_ro(void) { }
#endif
Linus Torvalds's avatar
Linus Torvalds committed
99
100
101
102
103

#ifdef CONFIG_TC
extern void tc_init(void);
#endif

104
enum system_states system_state __read_mostly;
Linus Torvalds's avatar
Linus Torvalds committed
105
106
107
108
109
110
111
112
113
114
EXPORT_SYMBOL(system_state);

/*
 * Boot command-line arguments
 */
#define MAX_INIT_ARGS CONFIG_INIT_ENV_ARG_LIMIT
#define MAX_INIT_ENVS CONFIG_INIT_ENV_ARG_LIMIT

extern void time_init(void);
/* Default late time init is NULL. archs can override this later. */
115
void (*__initdata late_time_init)(void);
Linus Torvalds's avatar
Linus Torvalds committed
116
117
extern void softirq_init(void);

118
119
120
121
122
123
/* Untouched command line saved by arch-specific code. */
char __initdata boot_command_line[COMMAND_LINE_SIZE];
/* Untouched saved command line (eg. for /proc) */
char *saved_command_line;
/* Command line for parameter parsing */
static char *static_command_line;
Linus Torvalds's avatar
Linus Torvalds committed
124
125

static char *execute_command;
126
static char *ramdisk_execute_command;
Linus Torvalds's avatar
Linus Torvalds committed
127

Jan Beulich's avatar
Jan Beulich committed
128
#ifdef CONFIG_SMP
Linus Torvalds's avatar
Linus Torvalds committed
129
/* Setup configured maximum number of CPUs to activate */
130
unsigned int __initdata setup_max_cpus = NR_CPUS;
131

Linus Torvalds's avatar
Linus Torvalds committed
132
133
134
135
136
137
138
139
140
141
/*
 * Setup routine for controlling SMP activation
 *
 * Command-line option of "nosmp" or "maxcpus=0" will disable SMP
 * activation entirely (the MPS table probe still happens, though).
 *
 * Command-line option of "maxcpus=<NUM>", where <NUM> is an integer
 * greater than 0, limits the maximum number of CPUs activated in
 * SMP mode to <NUM>.
 */
142
143

void __weak arch_disable_smp_support(void) { }
144

Linus Torvalds's avatar
Linus Torvalds committed
145
146
/*
 * "nosmp" early parameter: clamp the CPU limit to zero and invoke the
 * (possibly weak, empty) arch_disable_smp_support() hook.  @str is unused.
 */
static int __init nosmp(char *str)
{
	setup_max_cpus = 0;

	arch_disable_smp_support();
	return 0;
}

Jan Beulich's avatar
Jan Beulich committed
153
early_param("nosmp", nosmp);
Linus Torvalds's avatar
Linus Torvalds committed
154
155
156

/*
 * "maxcpus=" early parameter: let get_option() store the requested limit
 * in setup_max_cpus.  If the stored limit ends up being zero, also call
 * arch_disable_smp_support().  Always returns 0.
 */
static int __init maxcpus(char *str)
{
	get_option(&str, &setup_max_cpus);

	if (!setup_max_cpus)
		arch_disable_smp_support();

	return 0;
}

Hugh Dickins's avatar
Hugh Dickins committed
164
early_param("maxcpus", maxcpus);
Jan Beulich's avatar
Jan Beulich committed
165
#else
166
const unsigned int setup_max_cpus = NR_CPUS;
Jan Beulich's avatar
Jan Beulich committed
167
168
169
170
171
172
173
174
175
176
177
178
179
#endif

/*
 * If set, this is an indication to the drivers that reset the underlying
 * device before going ahead with the initialization otherwise driver might
 * rely on the BIOS and skip the reset operation.
 *
 * This is useful if kernel is booting in an unreliable environment.
 * For ex. kdump situation where previous kernel has crashed, BIOS has been
 * skipped and devices will be in unknown state.
 */
unsigned int reset_devices;
EXPORT_SYMBOL(reset_devices);
Linus Torvalds's avatar
Linus Torvalds committed
180

181
182
183
184
185
186
187
188
/*
 * Handler for the "reset_devices" boot option: raises the global
 * reset_devices flag.  @str (the text following the option name) is unused.
 */
static int __init set_reset_devices(char *str)
{
	reset_devices = 1;
	/* Non-zero makes obsolete_checksetup() stop and report a match. */
	return 1;
}

__setup("reset_devices", set_reset_devices);

Linus Torvalds's avatar
Linus Torvalds committed
189
190
191
192
193
194
195
196
197
static char * argv_init[MAX_INIT_ARGS+2] = { "init", NULL, };
char * envp_init[MAX_INIT_ENVS+2] = { "HOME=/", "TERM=linux", NULL, };
static const char *panic_later, *panic_param;

extern struct obs_kernel_param __setup_start[], __setup_end[];

/*
 * Match @line against the __setup table by prefix.
 *
 * Returns 1 as soon as a non-early entry either has no handler (obsolete
 * parameter, a warning is printed) or has a handler that returns non-zero.
 * Otherwise returns 1 if some early entry matched the parameter name
 * exactly (name followed by NUL or '='), and 0 if nothing matched.
 */
static int __init obsolete_checksetup(char *line)
{
	struct obs_kernel_param *entry = __setup_start;
	int matched_early = 0;

	do {
		int len = strlen(entry->str);

		if (strncmp(line, entry->str, len) == 0) {
			if (entry->early) {
				/*
				 * Already done in parse_early_param?
				 * (Needs exact match on param part).
				 * Keep iterating, as an early param and a
				 * __setup entry may share the same name.
				 */
				if (line[len] == '\0' || line[len] == '=')
					matched_early = 1;
			} else if (!entry->setup_func) {
				printk(KERN_WARNING "Parameter %s is obsolete,"
				       " ignored\n", entry->str);
				return 1;
			} else if (entry->setup_func(line + len)) {
				return 1;
			}
		}
	} while (++entry < __setup_end);

	return matched_early;
}

/*
 * This should be approx 2 Bo*oMips to start (note initial shift), and will
 * still work even if initially too large, it will just take slightly longer
 */
unsigned long loops_per_jiffy = (1<<12);

EXPORT_SYMBOL(loops_per_jiffy);

/* "debug" early parameter: set console_loglevel to 10.  @str is unused. */
static int __init debug_kernel(char *str)
{
	console_loglevel = 10;

	return 0;
}

/* "quiet" early parameter: set console_loglevel to 4.  @str is unused. */
static int __init quiet_kernel(char *str)
{
	console_loglevel = 4;

	return 0;
}

244
245
early_param("debug", debug_kernel);
early_param("quiet", quiet_kernel);
Linus Torvalds's avatar
Linus Torvalds committed
246
247
248
249

/*
 * "loglevel=" early parameter.
 *
 * @str: text following "loglevel=" (may be NULL or empty).
 *
 * Returns 0 when a number was parsed and installed as console_loglevel,
 * -EINVAL otherwise; do_early_param() reports a non-zero return as a
 * malformed early option.
 */
static int __init loglevel(char *str)
{
	int newlevel;

	/*
	 * Parse into a temporary and only commit on success.  Letting
	 * get_option() write straight into console_loglevel would replace
	 * the level with the result of a failed parse (i.e. 0), silencing
	 * the console and making boot failures very hard to debug.
	 */
	if (!get_option(&str, &newlevel))
		return -EINVAL;

	console_loglevel = newlevel;
	return 0;
}

253
early_param("loglevel", loglevel);
Linus Torvalds's avatar
Linus Torvalds committed
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278

/*
 * Unknown boot options get handed to init, unless they look like
 * failed parameters
 */
static int __init unknown_bootoption(char *param, char *val)
{
	unsigned int slot;
	char *dot;

	/* Change NUL term back to "=", to make "param" the whole string. */
	if (val) {
		char *name_end = param + strlen(param);

		if (val == name_end + 1) {
			/* param=val */
			val[-1] = '=';
		} else if (val == name_end + 2) {
			/*
			 * param="val": put the '=' right after the name and
			 * slide the value one byte left over the gap.
			 */
			val[-2] = '=';
			memmove(val - 1, val, strlen(val) + 1);
			val--;
		} else {
			BUG();
		}
	}

	/* Handle obsolete-style parameters */
	if (obsolete_checksetup(param))
		return 0;

	/*
	 * Preemptive maintenance for "why didn't my misspelled command
	 * line work?": a '.' in the name part means this looked like a
	 * module-style parameter, so complain rather than hand it to init.
	 */
	dot = strchr(param, '.');
	if (dot && (!val || dot < val)) {
		printk(KERN_ERR "Unknown boot option `%s': ignoring\n", param);
		return 0;
	}

	/* An overflow was already recorded; stop collecting. */
	if (panic_later)
		return 0;

	if (val) {
		/*
		 * Environment option: reuse the slot whose first
		 * (val - param) bytes match, else take the first free one.
		 */
		for (slot = 0; envp_init[slot]; slot++) {
			if (slot == MAX_INIT_ENVS) {
				panic_later = "Too many boot env vars at `%s'";
				panic_param = param;
			}
			if (!strncmp(param, envp_init[slot], val - param))
				break;
		}
		envp_init[slot] = param;
		return 0;
	}

	/* Command line option: append to init's argv. */
	for (slot = 0; argv_init[slot]; slot++) {
		if (slot == MAX_INIT_ARGS) {
			panic_later = "Too many boot init vars at `%s'";
			panic_param = param;
		}
	}
	argv_init[slot] = param;

	return 0;
}

316
317
318
319
#ifdef CONFIG_DEBUG_PAGEALLOC
int __read_mostly debug_pagealloc_enabled = 0;
#endif

Linus Torvalds's avatar
Linus Torvalds committed
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
/*
 * "init=" handler: remember @str as the program to execute and forget
 * the init arguments collected so far.
 */
static int __init init_setup(char *str)
{
	unsigned int idx = 1;

	execute_command = str;

	/*
	 * In case LILO is going to boot us with default command line,
	 * it prepends "auto" before the whole cmdline which makes
	 * the shell think it should execute a script with such name.
	 * So we ignore all arguments entered _before_ init=... [MJ]
	 */
	while (idx < MAX_INIT_ARGS)
		argv_init[idx++] = NULL;

	return 1;
}
__setup("init=", init_setup);

337
338
339
340
341
342
343
344
345
346
347
348
/*
 * "rdinit=" handler: remember @str as the ramdisk init program and
 * forget the init arguments collected so far.
 */
static int __init rdinit_setup(char *str)
{
	unsigned int idx = 1;

	ramdisk_execute_command = str;

	/* See "auto" comment in init_setup */
	while (idx < MAX_INIT_ARGS)
		argv_init[idx++] = NULL;

	return 1;
}
__setup("rdinit=", rdinit_setup);

Linus Torvalds's avatar
Linus Torvalds committed
349
350
351
352
353
354
355
356
357
358
359
360
#ifndef CONFIG_SMP

#ifdef CONFIG_X86_LOCAL_APIC
/*
 * Non-SMP build with CONFIG_X86_LOCAL_APIC: smp_init() only calls
 * APIC_init_uniprocessor().
 */
static void __init smp_init(void)
{
	APIC_init_uniprocessor();
}
#else
#define smp_init()	do { } while (0)
#endif

static inline void setup_per_cpu_areas(void) { }
361
static inline void setup_nr_cpu_ids(void) { }
Linus Torvalds's avatar
Linus Torvalds committed
362
363
364
365
static inline void smp_prepare_cpus(unsigned int maxcpus) { }

#else

366
367
368
369
370
#if NR_CPUS > BITS_PER_LONG
cpumask_t cpu_mask_all __read_mostly = CPU_MASK_ALL;
EXPORT_SYMBOL(cpu_mask_all);
#endif

371
372
373
374
375
376
377
/* Setup number of possible processor ids */
int nr_cpu_ids __read_mostly = NR_CPUS;
EXPORT_SYMBOL(nr_cpu_ids);

/* An arch may set nr_cpu_ids earlier if needed, so this would be redundant */
static void __init setup_nr_cpu_ids(void)
{
	/* Index of the highest bit set in the possible-CPU mask. */
	unsigned long highest =
		find_last_bit(cpumask_bits(cpu_possible_mask), NR_CPUS);

	nr_cpu_ids = highest + 1;
}

381
#ifndef CONFIG_HAVE_SETUP_PER_CPU_AREA
382
unsigned long __per_cpu_offset[NR_CPUS] __read_mostly;
Linus Torvalds's avatar
Linus Torvalds committed
383
384
385
386
387
388
389

EXPORT_SYMBOL(__per_cpu_offset);

/*
 * Generic per-cpu area setup: allocate one page-aligned unit per possible
 * CPU from bootmem, copy the per-cpu section template into each unit and
 * record each unit's offset from the template in __per_cpu_offset[].
 */
static void __init setup_per_cpu_areas(void)
{
	const unsigned long cpu_count = num_possible_cpus();
	const unsigned long unit = ALIGN(PERCPU_ENOUGH_ROOM, PAGE_SIZE);
	char *area;
	unsigned long cpu;

	/* Copy section for each CPU (we discard the original) */
	area = alloc_bootmem_pages(unit * cpu_count);

	for_each_possible_cpu(cpu) {
		__per_cpu_offset[cpu] = area - __per_cpu_start;
		memcpy(area, __per_cpu_start, __per_cpu_end - __per_cpu_start);
		area += unit;
	}
}
402
#endif /* CONFIG_HAVE_SETUP_PER_CPU_AREA */
Linus Torvalds's avatar
Linus Torvalds committed
403
404
405
406

/* Called by boot processor to activate the rest. */
static void __init smp_init(void)
{
	unsigned int cpu;

	/*
	 * Set up the current CPU as possible to migrate to.
	 * The other ones will be done by cpu_up/cpu_down()
	 */
	set_cpu_active(smp_processor_id(), true);

	/*
	 * Bring up present CPUs until the online count reaches
	 * setup_max_cpus.
	 * FIXME: This should be done in userspace --RR
	 */
	for_each_present_cpu(cpu) {
		if (num_online_cpus() >= setup_max_cpus)
			break;
		if (cpu_online(cpu))
			continue;
		cpu_up(cpu);
	}

	/* Any cleanup work */
	printk(KERN_INFO "Brought up %ld CPUs\n", (long)num_online_cpus());
	smp_cpus_done(setup_max_cpus);
}

#endif

430
431
432
433
434
435
436
437
438
439
440
441
442
443
/*
 * We need to store the untouched command line for future reference.
 * We also need to store the touched command line since the parameter
 * parsing is performed in place, and we should allow a component to
 * store reference of name/value for future reference.
 */
static void __init setup_command_line(char *command_line)
{
	/* Sizes include the terminating NUL. */
	const size_t boot_len = strlen(boot_command_line) + 1;
	const size_t work_len = strlen(command_line) + 1;

	saved_command_line = alloc_bootmem(boot_len);
	static_command_line = alloc_bootmem(work_len);

	/* Pristine copy, and the copy the parameter parser will work on. */
	strcpy(saved_command_line, boot_command_line);
	strcpy(static_command_line, command_line);
}

Linus Torvalds's avatar
Linus Torvalds committed
444
445
446
447
448
449
450
451
452
/*
 * We need to finalize in a non-__init function or else race conditions
 * between the root thread and the init thread may cause start_kernel to
 * be reaped by free_initmem before the root thread has proceeded to
 * cpu_idle.
 *
 * gcc-3.4 accidentally inlines this function, so use noinline.
 */

453
static noinline void __init_refok rest_init(void)
	__releases(kernel_lock)
{
	int kthreadd_pid;

	/* Spawn the kernel_init thread first, then kthreadd. */
	kernel_thread(kernel_init, NULL, CLONE_FS | CLONE_SIGHAND);
	numa_default_policy();

	kthreadd_pid = kernel_thread(kthreadd, NULL, CLONE_FS | CLONE_FILES);
	kthreadd_task = find_task_by_pid_ns(kthreadd_pid, &init_pid_ns);

	unlock_kernel();

	/*
	 * The boot idle thread must execute schedule()
	 * at least once to get things moving:
	 */
	init_idle_bootup_task(current);
	rcu_scheduler_starting();
	preempt_enable_no_resched();
	schedule();
	preempt_disable();

	/* Call into cpu_idle with preempt disabled */
	cpu_idle();
}
Linus Torvalds's avatar
Linus Torvalds committed
477
478
479
480
481
482
483

/* Check for early params. */
/*
 * parse_args() callback for early parsing.  Runs the handler of every
 * __setup table entry that is flagged early and named exactly @param; in
 * addition, "console" is also offered to the entry named "earlycon".
 * A handler returning non-zero only triggers a warning.  Always returns 0.
 */
static int __init do_early_param(char *param, char *val)
{
	struct obs_kernel_param *entry;

	for (entry = __setup_start; entry < __setup_end; entry++) {
		int wanted =
			(entry->early && strcmp(param, entry->str) == 0) ||
			(strcmp(param, "console") == 0 &&
			 strcmp(entry->str, "earlycon") == 0);

		if (!wanted)
			continue;

		if (entry->setup_func(val) != 0)
			printk(KERN_WARNING
			       "Malformed early option '%s'\n", param);
	}

	/* We accept everything at this stage. */
	return 0;
}

497
498
499
500
501
/*
 * Feed @cmdline to parse_args() with an empty parameter table (NULL, 0),
 * so that every option is handed to do_early_param().
 */
void __init parse_early_options(char *cmdline)
{
	parse_args("early options", cmdline, NULL, 0, do_early_param);
}

Linus Torvalds's avatar
Linus Torvalds committed
502
503
504
505
506
507
508
509
510
511
/* Arch code calls this early on, or if not, just before other parsing. */
void __init parse_early_param(void)
{
	static __initdata int already_parsed = 0;
	static __initdata char scratch[COMMAND_LINE_SIZE];

	/* Only the first call does any work. */
	if (!already_parsed) {
		/*
		 * Parse a scratch copy so boot_command_line itself is
		 * left untouched.  All fall through to do_early_param.
		 */
		strlcpy(scratch, boot_command_line, COMMAND_LINE_SIZE);
		parse_early_options(scratch);
		already_parsed = 1;
	}
}

/*
 *	Activate the first processor.
 */

521
522
523
524
static void __init boot_cpu_init(void)
{
	const int boot_cpu = smp_processor_id();

	/* Mark the boot cpu "present", "online" etc for SMP and UP case */
	set_cpu_online(boot_cpu, true);
	set_cpu_present(boot_cpu, true);
	set_cpu_possible(boot_cpu, true);
}

530
/* Weak default that does nothing; a non-weak definition overrides it. */
void __init __weak smp_setup_processor_id(void)
{
}

534
535
536
537
/* Weak default that does nothing; a non-weak definition overrides it. */
void __init __weak thread_info_cache_init(void)
{
}

Pekka Enberg's avatar
Pekka Enberg committed
538
539
540
541
542
/*
 * Set up kernel memory allocators
 */
static void __init mm_init(void)
{
	/*
	 * page_cgroup requires contiguous pages as memmap
	 * and it's bigger than MAX_ORDER unless SPARSEMEM.
	 */
	page_cgroup_init_flatmem();

	mem_init();
	kmem_cache_init();
	pgtable_cache_init();
	vmalloc_init();
}

Linus Torvalds's avatar
Linus Torvalds committed
554
555
556
557
/*
 * start_kernel - boot-time initialisation sequence.
 *
 * Runs the subsystem initialisers strictly in the order listed below and
 * finally hands over to rest_init().  The ordering is load-bearing; do not
 * reshuffle calls without checking their dependencies.
 */
asmlinkage void __init start_kernel(void)
{
	char *command_line;
	extern struct kernel_param __start___param[], __stop___param[];

	smp_setup_processor_id();

	/*
	 * Need to run as early as possible, to initialize the
	 * lockdep hash:
	 */
	lockdep_init();
	debug_objects_early_init();

	/*
	 * Set up the initial canary ASAP:
	 */
	boot_init_stack_canary();

	cgroup_init_early();

	local_irq_disable();
	early_boot_irqs_off();
	early_init_irq_lock_class();

	/*
	 * Interrupts are still disabled. Do necessary setups, then
	 * enable them
	 */
	lock_kernel();
	tick_init();
	boot_cpu_init();
	page_address_init();
	printk(KERN_NOTICE "%s", linux_banner);
	setup_arch(&command_line);
	mm_init_owner(&init_mm, &init_task);
	setup_command_line(command_line);
	setup_per_cpu_areas();
	setup_nr_cpu_ids();
	smp_prepare_boot_cpu();	/* arch-specific boot-cpu hooks */

	build_all_zonelists();
	page_alloc_init();

	printk(KERN_NOTICE "Kernel command line: %s\n", boot_command_line);
	parse_early_param();
	parse_args("Booting kernel", static_command_line, __start___param,
		   __stop___param - __start___param,
		   &unknown_bootoption);

	/*
	 * These use large bootmem allocations and must precede
	 * kmem_cache_init()
	 */
	pidhash_init();
	vfs_caches_init_early();
	sort_main_extable();
	trap_init();
	mm_init();

	/*
	 * Set up the scheduler prior to starting any interrupts (such as
	 * the timer interrupt). Full topology setup happens at smp_init()
	 * time - but meanwhile we still have a functioning scheduler.
	 */
	sched_init();

	/*
	 * Disable preemption - early bootup scheduling is extremely
	 * fragile until we cpu_idle() for the first time.
	 */
	preempt_disable();

	if (!irqs_disabled()) {
		printk(KERN_WARNING "start_kernel(): bug: interrupts were "
				"enabled *very* early, fixing it\n");
		local_irq_disable();
	}

	rcu_init();
	/* init some links before init_ISA_irqs() */
	early_irq_init();
	init_IRQ();
	prio_tree_init();
	init_timers();
	hrtimers_init();
	softirq_init();
	timekeeping_init();
	time_init();
	sched_clock_init();
	profile_init();

	if (!irqs_disabled()) {
		printk(KERN_CRIT "start_kernel(): bug: interrupts were "
				 "enabled early\n");
	}
	early_boot_irqs_on();
	local_irq_enable();

	/* Interrupts are enabled now so all GFP allocations are safe. */
	set_gfp_allowed_mask(__GFP_BITS_MASK);

	kmem_cache_init_late();

	/*
	 * HACK ALERT! This is early. We're enabling the console before
	 * we've done PCI setups etc, and console_init() must be aware of
	 * this. But we do want output early, in case something goes wrong.
	 */
	console_init();

	/* Report an overflow recorded earlier by unknown_bootoption(). */
	if (panic_later)
		panic(panic_later, panic_param);

	lockdep_info();

	/*
	 * Need to run this when irqs are enabled, because it wants
	 * to self-test [hard/soft]-irqs on/off lock inversion bugs
	 * too:
	 */
	locking_selftest();

#ifdef CONFIG_BLK_DEV_INITRD
	if (initrd_start && !initrd_below_start_ok &&
	    page_to_pfn(virt_to_page((void *)initrd_start)) < min_low_pfn) {
		printk(KERN_CRIT "initrd overwritten (0x%08lx < 0x%08lx) - "
		    "disabling it.\n",
		    page_to_pfn(virt_to_page((void *)initrd_start)),
		    min_low_pfn);
		initrd_start = 0;
	}
#endif
	page_cgroup_init();
	enable_debug_pagealloc();
	cpu_hotplug_init();
	kmemtrace_init();
	kmemleak_init();
	debug_objects_mem_init();
	idr_init_cache();
	setup_per_cpu_pageset();
	numa_policy_init();

	/* Optional hook; NULL unless something installed one. */
	if (late_time_init)
		late_time_init();

	calibrate_delay();
	pidmap_init();
	anon_vma_init();
#ifdef CONFIG_X86
	if (efi_enabled)
		efi_enter_virtual_mode();
#endif
	thread_info_cache_init();
	cred_init();
	fork_init(num_physpages);
	proc_caches_init();
	buffer_init();
	key_init();
	security_init();
	vfs_caches_init(num_physpages);
	radix_tree_init();
	signals_init();
	/* rootfs populating might need page-writeback */
	page_writeback_init();
#ifdef CONFIG_PROC_FS
	proc_root_init();
#endif
	cgroup_init();
	cpuset_init();
	taskstats_init_early();
	delayacct_init();

	check_bugs();

	acpi_early_init(); /* before LAPIC and SMP init */

	ftrace_init();

	/* Do the rest non-__init'ed, we're now alive */
	rest_init();
}

727
728
729
730
731
732
733
734
735
736
737
/* Call all constructor functions linked into the kernel. */
static void __init do_ctors(void)
{
#ifdef CONFIG_CONSTRUCTORS
	ctor_fn_t *ctor;
	ctor_fn_t *const last = (ctor_fn_t *) __ctors_end;

	/* Walk the table from __ctors_start up to (not including) __ctors_end. */
	for (ctor = (ctor_fn_t *) __ctors_start; ctor < last; ctor++)
		(*ctor)();
#endif
}

738
int initcall_debug;
739
core_param(initcall_debug, initcall_debug, bool, 0644);
Linus Torvalds's avatar
Linus Torvalds committed
740

741
/*
 * do_one_initcall - run one initcall and check the state it leaves behind.
 * @fn: the initcall to invoke.
 *
 * With initcall debugging enabled, the call is announced, boot-traced and
 * timed.  After @fn returns, a changed preempt count is restored to its
 * value from before the call and disabled interrupts are re-enabled; each
 * of those conditions (and, in debug mode, an error result other than
 * -ENODEV) is reported in a single summary line.
 *
 * Returns the value returned by @fn.
 */
int do_one_initcall(initcall_t fn)
{
	/*
	 * initcall_debug is registered as a writable (0644) core_param, so
	 * its value is not guaranteed to stay the same across fn().  Sample
	 * it once so the pre-call and post-call halves always agree;
	 * otherwise calltime could be read uninitialized and
	 * disable_boot_trace() could run without a matching enable.
	 */
	const int debug = initcall_debug;
	int count = preempt_count();
	ktime_t calltime, delta, rettime;
	char msgbuf[64];
	struct boot_trace_call call;
	struct boot_trace_ret ret;

	if (debug) {
		call.caller = task_pid_nr(current);
		printk("calling  %pF @ %i\n", fn, call.caller);
		calltime = ktime_get();
		trace_boot_call(&call, fn);
		enable_boot_trace();
	}

	ret.result = fn();

	if (debug) {
		disable_boot_trace();
		rettime = ktime_get();
		delta = ktime_sub(rettime, calltime);
		/* ns >> 10 divides by 1024: a cheap approximation of usecs. */
		ret.duration = (unsigned long long) ktime_to_ns(delta) >> 10;
		trace_boot_ret(&ret, fn);
		printk("initcall %pF returned %d after %Ld usecs\n", fn,
			ret.result, ret.duration);
	}

	msgbuf[0] = 0;

	if (ret.result && ret.result != -ENODEV && debug)
		snprintf(msgbuf, sizeof(msgbuf), "error code %d ", ret.result);

	if (preempt_count() != count) {
		strlcat(msgbuf, "preemption imbalance ", sizeof(msgbuf));
		/* Undo the imbalance so later initcalls start clean. */
		preempt_count() = count;
	}
	if (irqs_disabled()) {
		strlcat(msgbuf, "disabled interrupts ", sizeof(msgbuf));
		local_irq_enable();
	}
	if (msgbuf[0])
		printk("initcall %pF returned with %s\n", fn, msgbuf);

	return ret.result;
}


790
extern initcall_t __initcall_start[], __initcall_end[], __early_initcall_end[];
791
792
793
794
795

/*
 * Run every initcall located between __early_initcall_end and
 * __initcall_end, in table order.
 */
static void __init do_initcalls(void)
{
	initcall_t *entry = __early_initcall_end;

	while (entry < __initcall_end) {
		do_one_initcall(*entry);
		entry++;
	}

	/* Make sure there is no pending stuff from the initcall sequence */
	flush_scheduled_work();
}

/*
 * Ok, the machine is now initialized. None of the devices
 * have been touched yet, but the CPU subsystem is up and
 * running, and memory and process management works.
 *
 * Now we can finally start doing some real work..
 */
static void __init do_basic_setup(void)
{
	/* needed by module_init stage. */
	rcu_init_sched();

	init_workqueues();
	cpuset_init_smp();
	usermodehelper_init();
	driver_init();
	init_irq_proc();

	/* Constructors first, then the regular initcall levels. */
	do_ctors();
	do_initcalls();
}

822
/*
 * Run the initcalls located between __initcall_start and
 * __early_initcall_end, in table order.
 */
static void __init do_pre_smp_initcalls(void)
{
	initcall_t *entry = __initcall_start;

	while (entry < __early_initcall_end) {
		do_one_initcall(*entry);
		entry++;
	}
}

Linus Torvalds's avatar
Linus Torvalds committed
830
831
832
static void run_init_process(char *init_filename)
{
	argv_init[0] = init_filename;
833
	kernel_execve(init_filename, argv_init, envp_init);
Linus Torvalds's avatar
Linus Torvalds committed
834
835
}

836
837
838
/* This is a non __init function. Force it to be noinline otherwise gcc
 * makes it inline to init() and it becomes part of init.text section
 */
839
static noinline int init_post(void)
840
	__releases(kernel_lock)
841
{
842
843
	/* need to finish all async __init code before freeing the memory */
	async_synchronize_full();
844
845
846
847
848
849
850
851
852
853
854
855
	free_initmem();
	unlock_kernel();
	mark_rodata_ro();
	system_state = SYSTEM_RUNNING;
	numa_default_policy();

	if (sys_open((const char __user *) "/dev/console", O_RDWR, 0) < 0)
		printk(KERN_WARNING "Warning: unable to open an initial console.\n");

	(void) sys_dup(0);
	(void) sys_dup(0);

856
857
	current->signal->flags |= SIGNAL_UNKILLABLE;

858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
	if (ramdisk_execute_command) {
		run_init_process(ramdisk_execute_command);
		printk(KERN_WARNING "Failed to execute %s\n",
				ramdisk_execute_command);
	}

	/*
	 * We try each of these until one succeeds.
	 *
	 * The Bourne shell can be used instead of init if we are
	 * trying to recover a really broken machine.
	 */
	if (execute_command) {
		run_init_process(execute_command);
		printk(KERN_WARNING "Failed to execute %s.  Attempting "
					"defaults...\n", execute_command);
	}
	run_init_process("/sbin/init");
	run_init_process("/etc/init");
	run_init_process("/bin/init");
	run_init_process("/bin/sh");

	panic("No init found.  Try passing init= option to kernel.");
}

883
/*
 * Body of the thread created first by rest_init(): finishes bringing the
 * system up (SMP, initcalls, root filesystem) and then calls init_post().
 * @unused is ignored.
 */
static int __init kernel_init(void * unused)
{
	lock_kernel();

	/*
	 * init can allocate pages on any node
	 */
	set_mems_allowed(node_possible_map);

	/*
	 * init can run on any cpu.
	 */
	set_cpus_allowed_ptr(current, cpu_all_mask);

	/*
	 * Tell the world that we're going to be the grim
	 * reaper of innocent orphaned children.
	 *
	 * We don't want people to have to make incorrect
	 * assumptions about where in the task array this
	 * can be found.
	 */
	init_pid_ns.child_reaper = current;

	cad_pid = task_pid(current);

	smp_prepare_cpus(setup_max_cpus);

	do_pre_smp_initcalls();
	start_boot_trace();

	smp_init();
	sched_init_smp();

	do_basic_setup();

	/*
	 * check if there is an early userspace init.  If yes, let it do all
	 * the work
	 */
	if (!ramdisk_execute_command)
		ramdisk_execute_command = "/init";

	if (sys_access((const char __user *) ramdisk_execute_command, 0) != 0) {
		/* Not accessible: drop it and set up the namespace instead. */
		ramdisk_execute_command = NULL;
		prepare_namespace();
	}

	/*
	 * Ok, we have completed the initial bootup, and
	 * we're essentially up and running. Get rid of the
	 * initmem segments and start the user-mode stuff..
	 */
	init_post();

	return 0;
}