f2dbcfa738
What's happening is that the assertion in mm/page_alloc.c:move_freepages() is triggering: BUG_ON(page_zone(start_page) != page_zone(end_page)); Once I knew this is what was happening, I added some annotations: if (unlikely(page_zone(start_page) != page_zone(end_page))) { printk(KERN_ERR "move_freepages: Bogus zones: " "start_page[%p] end_page[%p] zone[%p]\n", start_page, end_page, zone); printk(KERN_ERR "move_freepages: " "start_zone[%p] end_zone[%p]\n", page_zone(start_page), page_zone(end_page)); printk(KERN_ERR "move_freepages: " "start_pfn[0x%lx] end_pfn[0x%lx]\n", page_to_pfn(start_page), page_to_pfn(end_page)); printk(KERN_ERR "move_freepages: " "start_nid[%d] end_nid[%d]\n", page_to_nid(start_page), page_to_nid(end_page)); ... And here's what I got: move_freepages: Bogus zones: start_page[2207d0000] end_page[2207dffc0] zone[fffff8103effcb00] move_freepages: start_zone[fffff8103effcb00] end_zone[fffff8003fffeb00] move_freepages: start_pfn[0x81f600] end_pfn[0x81f7ff] move_freepages: start_nid[1] end_nid[0] My memory layout on this box is: [ 0.000000] Zone PFN ranges: [ 0.000000] Normal 0x00000000 -> 0x0081ff5d [ 0.000000] Movable zone start PFN for each node [ 0.000000] early_node_map[8] active PFN ranges [ 0.000000] 0: 0x00000000 -> 0x00020000 [ 0.000000] 1: 0x00800000 -> 0x0081f7ff [ 0.000000] 1: 0x0081f800 -> 0x0081fe50 [ 0.000000] 1: 0x0081fed1 -> 0x0081fed8 [ 0.000000] 1: 0x0081feda -> 0x0081fedb [ 0.000000] 1: 0x0081fedd -> 0x0081fee5 [ 0.000000] 1: 0x0081fee7 -> 0x0081ff51 [ 0.000000] 1: 0x0081ff59 -> 0x0081ff5d So it's a block move in that 0x81f600-->0x81f7ff region which triggers the problem. This patch: Declarations of early_pfn_to_nid() are scattered over per-arch include files, and it is complicated to know when each declaration is used. I think this makes the fix for memmap init difficult. 
This patch moves all declarations to include/linux/mm.h. After this: if !CONFIG_ARCH_POPULATES_NODE_MAP && !CONFIG_HAVE_ARCH_EARLY_PFN_TO_NID -> Use static definition in include/linux/mm.h else if !CONFIG_HAVE_ARCH_EARLY_PFN_TO_NID -> Use generic definition in mm/page_alloc.c else -> per-arch back end function will be called. Signed-off-by: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com> Tested-by: KOSAKI Motohiro <kosaki.motohiro@jp.fujitsu.com> Reported-by: David Miller <davem@davemlloft.net> Cc: Mel Gorman <mel@csn.ul.ie> Cc: Heiko Carstens <heiko.carstens@de.ibm.com> Cc: <stable@kernel.org> [2.6.25.x, 2.6.26.x, 2.6.27.x, 2.6.28.x] Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> |
||
---|---|---|
.. | ||
native | ||
sn | ||
uv | ||
xen | ||
acpi-ext.h | ||
acpi.h | ||
agp.h | ||
asmmacro.h | ||
atomic.h | ||
auxvec.h | ||
bitops.h | ||
break.h | ||
bug.h | ||
bugs.h | ||
byteorder.h | ||
cache.h | ||
cacheflush.h | ||
checksum.h | ||
compat.h | ||
cpu.h | ||
cputime.h | ||
current.h | ||
cyclone.h | ||
delay.h | ||
device.h | ||
div64.h | ||
dma-mapping.h | ||
dma.h | ||
dmi.h | ||
elf.h | ||
emergency-restart.h | ||
errno.h | ||
esi.h | ||
fb.h | ||
fcntl.h | ||
fpswa.h | ||
fpu.h | ||
futex.h | ||
gcc_intrin.h | ||
hardirq.h | ||
hpsim.h | ||
hugetlb.h | ||
hw_irq.h | ||
ia32.h | ||
ia64regs.h | ||
intel_intrin.h | ||
intrinsics.h | ||
io.h | ||
ioctl.h | ||
ioctls.h | ||
iommu.h | ||
iosapic.h | ||
ipcbuf.h | ||
irq.h | ||
irq_regs.h | ||
Kbuild | ||
kdebug.h | ||
kexec.h | ||
kmap_types.h | ||
kprobes.h | ||
kregs.h | ||
kvm.h | ||
kvm_host.h | ||
kvm_para.h | ||
libata-portmap.h | ||
linkage.h | ||
local.h | ||
machvec.h | ||
machvec_dig.h | ||
machvec_dig_vtd.h | ||
machvec_hpsim.h | ||
machvec_hpzx1.h | ||
machvec_hpzx1_swiotlb.h | ||
machvec_init.h | ||
machvec_sn2.h | ||
machvec_uv.h | ||
machvec_xen.h | ||
mc146818rtc.h | ||
mca.h | ||
mca_asm.h | ||
meminit.h | ||
mman.h | ||
mmu.h | ||
mmu_context.h | ||
mmzone.h | ||
module.h | ||
msgbuf.h | ||
mutex.h | ||
nodedata.h | ||
numa.h | ||
page.h | ||
pal.h | ||
param.h | ||
paravirt.h | ||
paravirt_privop.h | ||
parport.h | ||
patch.h | ||
pci.h | ||
percpu.h | ||
perfmon.h | ||
perfmon_default_smpl.h | ||
pgalloc.h | ||
pgtable.h | ||
poll.h | ||
posix_types.h | ||
processor.h | ||
ptrace.h | ||
ptrace_offsets.h | ||
pvclock-abi.h | ||
resource.h | ||
rse.h | ||
rwsem.h | ||
sal.h | ||
scatterlist.h | ||
sections.h | ||
segment.h | ||
sembuf.h | ||
serial.h | ||
setup.h | ||
shmbuf.h | ||
shmparam.h | ||
sigcontext.h | ||
siginfo.h | ||
signal.h | ||
smp.h | ||
socket.h | ||
sockios.h | ||
sparsemem.h | ||
spinlock.h | ||
spinlock_types.h | ||
stat.h | ||
statfs.h | ||
string.h | ||
suspend.h | ||
swab.h | ||
swiotlb.h | ||
sync_bitops.h | ||
syscall.h | ||
system.h | ||
termbits.h | ||
termios.h | ||
thread_info.h | ||
timex.h | ||
tlb.h | ||
tlbflush.h | ||
topology.h | ||
types.h | ||
uaccess.h | ||
ucontext.h | ||
unaligned.h | ||
uncached.h | ||
unistd.h | ||
unwind.h | ||
user.h | ||
ustack.h | ||
vga.h | ||
xor.h |