[PATCH] 2.4.25-rc1: Shutdown kernel on zone-alignment failure

From: Michael Frank
Date: Fri Feb 06 2004 - 16:39:43 EST


Marcelo,

The following is applicable to all architectures using zones.

When zone alignment goes wrong, a message is printed:
BUG: wrong zone alignment, it will crash

_BUT_ kernel runs until it dies of the alignment problems - it took me
hours until I found the message after looking elsewhere ;)

This patch:

- Should zone alignment fail, it will force a BUG() once the BUG handler inits

- Improves the messages of zone init to help debug zone alignment problems

Please apply.

The highmem autoalignment patch will follow after more testing.

Regards
Michael


diff -uN -r -X /home/mhf/sys/dont/dontdiff linux-2.4.25-rc1-Vanilla/include/linux/kernel.h linux-2.4.25-rc1-mhf176/include/linux/kernel.h
--- linux-2.4.25-rc1-Vanilla/include/linux/kernel.h 2004-02-06 17:09:26.000000000 +0800
+++ linux-2.4.25-rc1-mhf176/include/linux/kernel.h 2004-02-07 04:43:49.000000000 +0800
@@ -45,7 +45,7 @@
#define minimum_console_loglevel (console_printk[2])
#define default_console_loglevel (console_printk[3])

-# define NORET_TYPE /**/
+# define NORET_TYPE
# define ATTRIB_NORET __attribute__((noreturn))
# define NORET_AND noreturn,

@@ -104,7 +104,7 @@

extern void bust_spinlocks(int yes);
extern int oops_in_progress; /* If set, an oops, panic(), BUG() or die() is in progress */
-
+extern int force_bug; /* If set, BUG() will be forced when handler initialized */
extern int tainted;
extern const char *print_tainted(void);

diff -uN -r -X /home/mhf/sys/dont/dontdiff linux-2.4.25-rc1-Vanilla/init/main.c linux-2.4.25-rc1-mhf176/init/main.c
--- linux-2.4.25-rc1-Vanilla/init/main.c 2004-02-06 17:06:58.000000000 +0800
+++ linux-2.4.25-rc1-mhf176/init/main.c 2004-02-07 05:11:07.000000000 +0800
@@ -121,6 +121,7 @@
extern void time_init(void);
extern void softirq_init(void);

+int force_bug;
int rows, cols;

char *execute_command;
@@ -422,6 +423,14 @@
ccwcache_init();
#endif
signals_init();
+
+ /*
+ * Something went badly wrong during the early initialisation process,
+ * so lets die before doing any damage or wasting people's time
+ * running a half dead kernel.
+ */
+ if (force_bug)
+ BUG();
#ifdef CONFIG_PROC_FS
proc_root_init();
#endif
diff -uN -r -X /home/mhf/sys/dont/dontdiff linux-2.4.25-rc1-Vanilla/mm/page_alloc.c linux-2.4.25-rc1-mhf176/mm/page_alloc.c
--- linux-2.4.25-rc1-Vanilla/mm/page_alloc.c 2004-02-06 17:06:58.000000000 +0800
+++ linux-2.4.25-rc1-mhf176/mm/page_alloc.c 2004-02-07 04:48:30.000000000 +0800
@@ -726,8 +726,8 @@
unsigned long i, j;
unsigned long map_size;
unsigned long totalpages, offset, realtotalpages;
- const unsigned long zone_required_alignment = 1UL << (MAX_ORDER-1);
-
+ const unsigned long zone_required_alignment = 1UL << (PAGE_SHIFT + MAX_ORDER-1);
+ unsigned long zone_bad_alignment;
if (zone_start_paddr & ~PAGE_MASK)
BUG();

@@ -741,7 +741,8 @@
for (i = 0; i < MAX_NR_ZONES; i++)
realtotalpages -= zholes_size[i];

- printk("On node %d totalpages: %lu\n", nid, realtotalpages);
+ printk("On node %d totalpages: %lu, zones aligned at 0x%lx\n",
+ nid, realtotalpages,zone_required_alignment);

/*
* Some architectures (with lots of mem and discontinous memory
@@ -774,7 +775,20 @@
if (zholes_size)
realsize -= zholes_size[j];

- printk("zone(%lu): %lu pages.\n", j, size);
+ printk("zone(%lu): %lu pages, physical start address at 0x%lx\n",
+ j, size,zone_start_paddr);
+
+ /*
+ * Here the alignment of a zone is checked. Should alignment
+ * be wrong, all that can be done is to print an error message
+ * and defer the the BUG handler as it is not yet initialized.
+ */
+ if ((zone_bad_alignment = (zone_start_paddr & (zone_required_alignment-1)))) {
+ printk("zone(%lu): FATAL ERROR: wrong zone alignment 0x%lx"
+ " - will force kernel BUG\n",
+ j,zone_bad_alignment);
+ force_bug = 1;
+ }
zone->size = size;
zone->realsize = realsize;
zone->name = zone_names[j];
@@ -784,7 +798,6 @@
zone->need_balance = 0;
zone->nr_active_pages = zone->nr_inactive_pages = 0;

-
if (!size)
continue;

@@ -837,8 +850,6 @@
zone->zone_start_mapnr = offset;
zone->zone_start_paddr = zone_start_paddr;

- if ((zone_start_paddr >> PAGE_SHIFT) & (zone_required_alignment-1))
- printk("BUG: wrong zone alignment, it will crash\n");

/*
* Initially all pages are reserved - free ones are freed

-
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/