From mboxrd@z Thu Jan 1 00:00:00 1970 From: MaoXiaoyun Subject: RE: Kernel BUG at arch/x86/mm/tlb.c:61 Date: Thu, 14 Apr 2011 14:16:24 +0800 Message-ID: References: , , , , , , , <4DA3438A.6070503@goop.org>, , , <20110412100000.GA15647@dumpdata.com> Mime-Version: 1.0 Content-Type: multipart/mixed; boundary="===============0760198219==" Return-path: In-Reply-To: <20110412100000.GA15647@dumpdata.com> List-Unsubscribe: , List-Post: List-Help: List-Subscribe: , Sender: xen-devel-bounces@lists.xensource.com Errors-To: xen-devel-bounces@lists.xensource.com To: xen devel Cc: jeremy@goop.org, giamteckchoon@gmail.com, konrad.wilk@oracle.com List-Id: xen-devel@lists.xenproject.org --===============0760198219== Content-Type: multipart/alternative; boundary="_702121fa-b4c8-4aa3-b55a-69720ad5fc06_" --_702121fa-b4c8-4aa3-b55a-69720ad5fc06_ Content-Type: text/plain; charset="gb2312" Content-Transfer-Encoding: quoted-printable Hi: =20 I've done test with "cpuidle=3D0 cpufreq=3Dnone", two machine crash= ed. =20 blktap_sysfs_destroy blktap_sysfs_destroy blktap_sysfs_create: adding attributes for dev ffff8800ad581000 blktap_sysfs_create: adding attributes for dev ffff8800a48e3e00 ------------[ cut here ]------------ kernel BUG at arch/x86/mm/tlb.c:61! 
invalid opcode: 0000 [#1] SMP=20 last sysfs file: /sys/block/tapdeve/dev CPU 0=20 Modules linked in: 8021q garp blktap xen_netback xen_blkback blkback_page= map nbd bridge stp llc autofs4 ipmi_devintf ipmi_si ipmi_ms ghandler lockd sunrpc bonding ipv6 xenfs dm_multipath video output sbs sb= shc parport_pc lp parport ses enclosure snd_seq_dummy bnx2=20 serio_raw snd_seq_oss snd_seq_midi_event snd_seq snd_seq_device snd_pcm_o= ss snd_mixer_oss snd_pcm i2c_i801 snd_timer i2c_core snd iT CO_wdt pata_acpi soundcore iTCO_vendor_ support ata_generic snd_page_alloc pcspkr ata_piix shpchp mptsas mptscsih= mptbase [last unloa ded: freq_table] Pid: 8022, comm: khelper Not tainted 2.6.32.36xen #1 Tecal RH2285 = =20 RIP: e030:[] [] leave_mm+0x15/0x46 RSP: e02b:ffff88002803ee48 EFLAGS: 00010046 RAX: 0000000000000000 RBX: 0000000000000001 RCX: ffffffff81675980 RDX: ffff88002803ee78 RSI: 0000000000000000 RDI: 0000000000000000 RBP: ffff88002803ee48 R08: ffff8800a4929000 R09: dead000000200200 R10: dead000000100100 R11: ffffffff81447292 R12: ffff88012ba07b80 R13: ffff880028046020 R14: 00000000000004fb R15: 0000000000000000 FS: 00007f410af416e0(0000) GS:ffff88002803b000(0000) knlGS:0000000000000= 000 CS: e033 DS: 0000 ES: 0000 CR0: 000000008005003b CR2: 0000000000469000 CR3: 00000000ad639000 CR4: 0000000000002660 DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000 DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400 Process khelper (pid: 8022, threadinfo ffff8800a4846000, task ffff8800a9e= d0000) Stack: ffff88002803ee68 ffffffff8100e4a4 0000000000000001 ffff880097de3b88 <0> ffff88002803ee98 ffffffff81087224 ffff88002803ee78 ffff88002803ee78 <0> ffff88015f808180 00000000000004fb ffff88002803eea8 ffffffff810100e8 Call Trace: =20 [] drop_other_mm_ref+0x2a/0x53 [] generic_smp_call_function_single_interrupt+0xd8/0xf= c [] xen_call_function_single_interrupt+0x13/0x28 [] handle_IRQ_event+0x66/0x120 [] handle_percpu_irq+0x41/0x6e [] 
__xen_evtchn_do_upcall+0x1ab/0x27d [] xen_evtchn_do_upcall+0x33/0x46 [] xen_do_hypervisor_callback+0x1e/0x30 =20 [] ? _spin_unlock_irqrestore+0x15/0x17 [] ? xen_restore_fl_direct_end+0x0/0x1 [] ? flush_old_exec+0x3ac/0x500 [] ? load_elf_binary+0x0/0x17ef [] ? load_elf_binary+0x0/0x17ef [] ? load_elf_binary+0x398/0x17ef [] ? need_resched+0x23/0x2d =20 [] ? process_measurement+0xc0/0xd7 [] ? load_elf_binary+0x0/0x17ef [] ? search_binary_handler+0xc8/0x255 [] ? do_execve+0x1c3/0x29e [] ? sys_execve+0x43/0x5d [] ? __call_usermodehelper+0x0/0x6f [] ? kernel_execve+0x68/0xd0 [] ? __call_usermodehelper+0x0/0x6f [] ? xen_restore_fl_direct_end+0x0/0x1 [] ? ____call_usermodehelper+0x113/0x11e [] ? child_rip+0xa/0x20 [] ? __call_usermodehelper+0x0/0x6f [] ? int_ret_from_sys_call+0x7/0x1b [] ? retint_restore_args+0x5/0x6 [] ? c hild_rip+0x0/0x20 Code: 41 5e 41 5f c9 c3 55 48 89 e5 0f 1f 44 00 00 e8 17 ff ff ff c9 c3 5= 5 48 89 e5 0f 1f 44 00 00 65 8b 04 25 c8 55 01 00 ff c8 75 04 <0f> 0b eb = fe 65 48 8b 34 25 c0 55 01 00 48 81 c6 b8 02 00 00 e8=20 RIP [] leave_mm+0x15/0x46 RSP ---[ end trace 1522f17fdfc9162d ]--- Kernel panic - not syncing: Fatal exception in interrupt Pid: 8022, comm: khelper Tainted: G D 2.6.32.36xen #1 Call Trace: [] panic+0xe0/0x19a [] ? init_amd+0x296/0x37a [] ? xen_force_evtchn_callback+0xd/0xf [] ? check_events+0x12/0x20 [] ? xen_restore_fl_direct_end+0x0/0x1 [] ? print_oops_end_marker+0x23/0x25 [] oops_end+0xb6/0xc6 [] die+0x5a/0x63 [] do_trap+0x115/0x124 [] do_invalid_op+0x9c/0xa5 [] ? leave_mm+0x15/0x46 [] ? xen_clocksource_read+0x21/0x23 [] ? HYPERVISOR_vcpu_op+0xf/0x11 [] ? xen_vcpuop_set_next_event+0x52/0x67 [] invalid_op+0x1b/0x20 [] ? _spin_unlock_irqrestore+0x15/0x17 [] ? 
leave_mm+0x15/0x46 [] drop_other_mm_ref+0x2a/0x53 [] generic_smp_call_function_single_interrupt+0xd8/0xf= c [] xen_call_function_single_interrupt+0x13/0x28 [] handle_IRQ_event+0x66/0x120 [] handle_percpu_irq+0x41/0x6e [] __xen_evtchn_do_upcall+0x1ab/0x27d [] xen_evtchn_do_upcall+0x33/0x46 [] xen_do_hypervisor_callback+0x1e/0x30 [] ? _spin_unlock_irqrestore+0x15/0x17 [] ? xen_restore_fl_direct_end+0x0/0x1 [] ? flush_old_exec+0x3ac/0x500 [] ? load_elf_binary+0x0/0x17ef [] ? load_elf_binary+0x0/0x17ef [] ? load_elf_binary+0x398/0x17ef [] ? need_resched+0x23/0x 2d [] ? process_measurement+0xc0/0xd7 [] ? load_elf_binary+0x0/0x17ef [] ? search_binary_handler+0xc8/0x255 [] ? do_execve+0x1c3/0x29e [] ? sys_execve+0x43/0x5d [] ? __call_usermodehelper+0x0/0x6f [] ? kernel_execve+0x68/0xd0 [] ? __call_usermodehelper+0x0/0x6f [] ? xen_restore_fl_direct_end+0x0/0x1 [] ? ____call_usermodehelper+0x113/0x11e [] ? child_rip+0xa/0x20 [] ? __call_usermodehelper+0x0/0x6f [] ? int_ret_from_sys_call+0x7/0x1b [] ? retint_restore_args+0x5/0x6 [] ? child_rip+0x0/0x20 (XEN) Domain 0 crashed: 'noreboot' set - not rebooting. =20 > Date: Tue, 12 Apr 2011 06:00:00 -0400 > From: konrad.wilk@oracle.com > To: tinnycloud@hotmail.com > CC: xen-devel@lists.xensource.com; giamteckchoon@gmail.com; jeremy@goop= .org > Subject: Re: Kernel BUG at arch/x86/mm/tlb.c:61 >=20 > On Tue, Apr 12, 2011 at 05:11:51PM +0800, MaoXiaoyun wrote: > >=20 > > Hi : > >=20 > > We are using pvops kernel 2.6.32.36 + xen 4.0.1, but confront a kerne= l panic bug. > >=20 > > 2.6.32.36 Kernel: http://git.kernel.org/?p=3Dlinux/kernel/git/jeremy/= xen.git;a=3Dcommit;h=3Dbb1a15e55ec665a64c8a9c6bd699b1f16ac01ff4 > > Xen 4.0.1 http://xenbits.xen.org/hg/xen-4.0-testing.hg/rev/b536ebfba1= 83=20 > >=20 > > Our test is simple, 24 HVMS(Win2003 ) on a single host, each HVM loop= es in restart every 15minutes. >=20 > What is the storage that you are using for your guests? AoE? Local disk= s? 
>=20 > > About 17 machines are invovled in the test, after 10 hours run, one c= onfrontted a crash at arch/x86/mm/tlb.c:61 > >=20 > > Currently I am trying "cpuidle=3D0 cpufreq=3Dnone" tests based on Tec= k's suggestion. > >=20 > > Any comments, thanks.=20 > >=20 > > =3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3Dcrash log=3D=3D=3D=3D=3D= =3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D > > INIT: Id "s0" respawning too fast: disabled for 5 minutes > > __ratelimit: 14 callbacks suppressed > > blktap_sysfs_destroy > > blktap_sysfs_destroy > > ------------[ cut here ]------------ > > kernel BUG at arch/x86/mm/tlb.c:61! > > invalid opcode: 0000 [#1] SMP=20 > > last sysfs file: /sys/devices/system/xen_memory/xen_memory0/info/curr= ent_kb > > CPU 1=20 > > Modules linked in: 8021q garp xen_netback xen_blkback blktap blkback_= pagemap nbd bridge stp llc autofs4 ipmi_devintf ipmi_si ipmi_msghandler l= ockd sunrpc bonding ipv6 xenfs dm_multipath video output sbs sbshc parpor= t_pc lp parport ses enclosure snd_seq_dummy snd_seq_oss snd_seq_midi_even= t snd_seq snd_seq_device serio_raw bnx2 snd_pcm_oss snd_mixer_oss snd_pcm= snd_timer iTCO_wdt snd soundcore snd_page_alloc i2c_i801 iTCO_vendor_sup= port i2c_core pcspkr pata_acpi ata_generic ata_piix shpchp mptsas mptscsi= h mptbase [last unloaded: freq_table] > > Pid: 25581, comm: khelper Not tainted 2.6.32.36fixxen #1 Tecal RH2285= =20 > > RIP: e030:[] [] leave_mm+0x15/0x4= 6 > > RSP: e02b:ffff88002805be48 EFLAGS: 00010046 > > RAX: 0000000000000000 RBX: 0000000000000001 RCX: ffff88015f8e2da0 > > RDX: ffff88002805be78 RSI: 0000000000000000 RDI: 0000000000000001 > > RBP: ffff88002805be48 R08: ffff88009d662000 R09: dead000000200200 > > R10: dead000000100100 R11: ffffffff814472b2 R12: ffff88009bfc1880 > > R13: ffff880028063020 R14: 00000000000004f6 R15: 0000000000000000 > > FS: 00007f62362d66e0(0000) GS:ffff880028058000(0000) knlGS:0000000000= 000000 > > CS: e033 DS: 0000 ES: 0000 CR0: 000000008005003b > > CR2: 
0000003aabc11909 CR3: 000000009b8ca000 CR4: 0000000000002660 > > DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000 > > DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400 > > Process khelper (pid: 25581, threadinfo ffff88007691e000, task ffff88= 009b92db40) > > Stack: > > ffff88002805be68 ffffffff8100e4ae 0000000000000001 ffff88009d733b88 > > <0> ffff88002805be98 ffffffff81087224 ffff88002805be78 ffff88002805be= 78 > > <0> ffff88015f808360 00000000000004f6 ffff88002805bea8 ffffffff810101= 08 > > Call Trace: > > =20 > > [] drop_other_mm_ref+0x2a/0x53 > > [] generic_smp_call_function_single_interrupt+0xd8/= 0xfc > > [] xen_call_function_single_interrupt+0x13/0x28 > > [] handle_IRQ_event+0x66/0x120 > > [] handle_percpu_irq+0x41/0x6e > > [] __xen_evtchn_do_upcall+0x1ab/0x27d > > [] xen_evtchn_do_upcall+0x33/0x46 > > [] xen_do_hypervisor_callback+0x1e/0x30 > > =20 > > [] ? _spin_unlock_irqrestore+0x15/0x17 > > [] ? xen_restore_fl_direct_end+0x0/0x1 > > [] ? flush_old_exec+0x3ac/0x500 > > [] ? load_elf_binary+0x0/0x17ef > > [] ? load_elf_binary+0x0/0x17ef > > [] ? load_elf_binary+0x398/0x17ef > > [] ? need_resched+0x23/0x2d > > [] ? process_measurement+0xc0/0xd7 > > [] ? load_elf_binary+0x0/0x17ef > > [] ? search_binary_handler+0xc8/0x255 > > [] ? do_execve+0x1c3/0x29e > > [] ? sys_execve+0x43/0x5d > > [] ? __call_usermodehelper+0x0/0x6f > > [] ? kernel_execve+0x68/0xd0 > > [] ? __call_usermodehelper+0x0/0x6f > > [] ? xen_restore_fl_direct_end+0x0/0x1 > > [] ? ____call_usermodehelper+0x113/0x11e > > [] ? child_rip+0xa/0x20 > > [] ? __call_usermodehelper+0x0/0x6f > > [] ? int_ret_from_sys_call+0x7/0x1b > > [] ? retint_restore_args+0x5/0x6 > > [] ? 
child_rip+0x0/0x20 > > Code: 41 5e 41 5f c9 c3 55 48 89 e5 0f 1f 44 00 00 e8 17 ff ff ff c9 = c3 55 48 89 e5 0f 1f 44 00 00 65 8b 04 25 c8 55 01 00 ff c8 75 04 <0f> 0b= eb fe 65 48 8b 34 25 c0 55 01 00 48 81 c6 b8 02 00 00 e8=20 > > RIP [] leave_mm+0x15/0x46 > > RSP > > ---[ end trace ce9cee6832a9c503 ]--- > > Kernel panic - not syncing: Fatal exception in interrupt > > Pid: 25581, comm: khelper Tainted: G D 2.6.32.36fixxen #1 > > Call Trace: > > [] panic+0xe0/0x19a > > [] ? init_amd+0x296/0x37a > > [] ? xen_force_evtchn_callback+0xd/0xf > > [] ? check_events+0x12/0x20 > > [] ? xen_restore_fl_direct_end+0x0/0x1 > > [] ? print_oops_end_marker+0x23/0x25 > > [] oops_end+0xb6/0xc6 > > [] die+0x5a/0x63 > > [] do_trap+0x115/0x124 > > [] do_invalid_op+0x9c/0xa5 > > [] ? leave_mm+0x15/0x46 > > [] ? xen_clocksource_read+0x21/0x23 > > [] ? HYPERVISOR_vcpu_op+0xf/0x11 > > [] ? xen_vcpuop_set_next_event+0x52/0x67 > > [] ? clockevents_program_event+0x78/0x81 > > [] invalid_op+0x1b/0x20 > > [] ? _spin_unlock_irqrestore+0x15/0x17 > > [] ? leave_mm+0x15/0x46 > > [] drop_other_mm_ref+0x2a/0x53 > > [] generic_smp_call_function_single_interrupt+0xd8/= 0xfc > > [] xen_call_function_single_interrupt+0x13/0x28 > > [] handle_IRQ_event+0x66/0x120 > > [] handle_percpu_irq+0x41/0x6e > > [] __xen_evtchn_do_upcall+0x1ab/0x27d > > [] xen_evtchn_do_upcall+0x33/0x46 > > [] xen_do_hypervisor_callback+0x1e/0x30 > > [] ? _spin_unlock_irqrestore+0x15/0x17 > > [] ? xen_restore_fl_direct_end+0x0/0x1 > > [] ? flush_old_exec+0x3ac/0x500 > > [] ? load_elf_binary+0x0/0x17ef > > [] ? load_elf_binary+0x0/0x17ef > > [] ? load_elf_binary+0x398/0x17ef > > [] ? need_resched+0x23/0x2d > > [] ? process_measurement+0xc0/0xd7 > > [] ? load_elf_binary+0x0/0x17ef > > [] ? search_binary_handler+0xc8/0x255 > > [] ? do_execve+0x1c3/0x29e > > [] ? sys_execve+0x43/0x5d > > [] ? __call_usermodehelper+0x0/0x6f > > [] ? kernel_execve+0x68/0xd0 > > [] ? __call_usermodehelper+0x0/0x6f > > [] ? 
xen_restore_fl_direct_end+0x0/0x1 > > [] ? ____call_usermodehelper+0x113/0x11e > > [] ? child_rip+0xa/0x20 > > [] ? __call_usermodehelper+0x0/0x6f > > [] ? int_ret_from_sys_call+0x7/0x1b > > [] ? retint_restore_args+0x5/0x6 > > [] ? child_rip+0x0/0x20 > >=20 > >=20 =20 --_702121fa-b4c8-4aa3-b55a-69720ad5fc06_ Content-Type: text/html; charset="gb2312" Content-Transfer-Encoding: quoted-printable Hi:
 
      I've done test with "cpuidle=3D0 cpufreq=3D= none", two machine crashed.
 
blktap_sysfs_destroy
blktap_sysfs_dest= roy
blktap_sysfs_create: adding attributes for dev=  ffff8800ad581000
blktap_sysfs_create: adding attribute= s for dev ffff8800a48e3e00
------------[ cut = here ]------------
kernel BUG at arch/x86/mm/tlb.c= :61!
invalid opcode: 0000 [#1] SMP 
last&n= bsp;sysfs file: /sys/block/tapdeve/dev
CPU 0 
M= odules linked in: 8021q garp blktap xen_net= back xen_blkback blkback_pagemap nbd bridge stp&= nbsp;llc autofs4 ipmi_devintf ipmi_si ipmi_ms
ghan= dler lockd sunrpc bonding ipv6 xenfs dm_mul= tipath video output sbs sbshc parport_pc lp=  parport ses enclosure snd_seq_dummy bnx2 <= BR>serio_raw snd_seq_oss snd_seq_midi_event&n bsp;snd_seq snd_seq_device snd_pcm_oss snd_mixer_oss = ;snd_pcm i2c_i801 snd_timer i2c_core snd iT
C= O_wdt pata_acpi soundcore iTCO_vendor_

support ata_generic snd_page_alloc pcspkr ata_pii= x shpchp mptsas mptscsih mptbase [last unlo= a
ded: freq_table]
Pid: 8022, comm: khelper&nbs= p;Not tainted 2.6.32.36xen #1 Tecal RH2285 =          
RIP: e030:= [<ffffffff8103a3cb>]  [<ffffffff8103a3cb>] lea= ve_mm+0x15/0x46
RSP: e02b:ffff88002803ee48  EFLAGS:&nbs= p;00010046
RAX: 0000000000000000 RBX: 0000000000000001&= nbsp;RCX: ffffffff81675980
RDX: ffff88002803ee78 RSI:&n= bsp;0000000000000000 RDI: 0000000000000000
RBP: ffff880= 02803ee48 R08: ffff8800a4929000 R09: dead00000 0200200
R10: dead000000100100 R11: ffffffff81447292&nb= sp;R12: ffff88012ba07b80
R13: ffff880028046020 R14:&nbs= p;00000000000004fb R15: 0000000000000000
FS:  0000= 7f410af416e0(0000) GS:ffff88002803b000(0000) knlGS:000000000000= 0000
CS:  e033 DS: 0000 ES: 0000 CR= 0: 000000008005003b
CR2: 0000000000469000 CR3: 000= 00000ad639000 CR4: 0000000000002660
DR0: 00000000000000= 00 DR1: 0000000000000000 DR2: 0000000000000000
DR3= : 0000000000000000 DR6: 00000000ffff0ff0 DR7: 00= 00000000000400
Process khelper (pid: 8022, threadi= nfo ffff8800a4846000, task ffff8800a9ed0000)
Stack:
=  ffff88002803ee68 ffffffff8100e4a4 0000000000000001 f= fff880097de3b88
<0> ffff88002803ee98 ffffffff81087224&= nbsp;ffff88002803ee78 ffff88002803ee7 8
<0> ffff88015f808180 00000000000004fb ffff8800= 2803eea8 ffffffff810100e8
Call Trace:
 <IRQ>&n= bsp;
 [<ffffffff8100e4a4>] drop_other_mm_ref+0x2a/0x53=
 [<ffffffff81087224>] generic_smp_call_function_singl= e_interrupt+0xd8/0xfc
 [<ffffffff810100e8>] xen_call_f= unction_single_interrupt+0x13/0x28
 [<ffffffff810a936a>]&nb= sp;handle_IRQ_event+0x66/0x120
 [<ffffffff810aac5b>] h= andle_percpu_irq+0x41/0x6e
 [<ffffffff8128c1a8>] __xen= _evtchn_do_upcall+0x1ab/0x27d
 [<ffffffff8128dcf9>] xe= n_evtchn_do_upcall+0x33/0x46
 [<ffffffff81013efe>] xen= _do_hypervisor_callback+0x1e/0x30
 <EOI> 
 [&l= t;ffffffff81447292>] ? _spin_unlock_irqrestore+0x15/0x17
=  [<ffffffff8100f8af>] ? xen_restore_fl_direct_end+0x= 0/0x1
 [<ffffffff81113f75>]& nbsp;? flush_old_exec+0x3ac/0x500
 [<ffffffff81150dc9>= ;] ? load_elf_binary+0x0/0x17ef
 [<ffffffff81150dc9&= gt;] ? load_elf_binary+0x0/0x17ef
 [<ffffffff8115116= 1>] ? load_elf_binary+0x398/0x17ef
 [<ffffffff810= 42fcf>] ? need_resched+0x23/0x2d
 
[<ffffffff8= 11f463c>] ? process_measurement+0xc0/0xd7
 [<ffff= ffff81150dc9>] ? load_elf_binary+0x0/0x17ef
 [<ff= ffffff81113098>] ? search_binary_handler+0xc8/0x255
 = ;[<ffffffff81114366>] ? do_execve+0x1c3/0x29e
 [&= lt;ffffffff8101155d>] ? sys_execve+0x43/0x5d
 [<f= fffffff8106fc45>] ? __call_usermodehelper+0x0/0x6f
 = [<ffffffff81013e28>] ? kernel_execve+0x68/0xd0
 [= <ffffffff8106fc45>] ? __call_usermodehelper+0x0/0x6f
&= nbsp;[<ffffffff8100f8af>] ?&nbs p;xen_restore_fl_direct_end+0x0/0x1
 [<ffffffff8106fb64>]&= nbsp;? ____call_usermodehelper+0x113/0x11e
 [<ffffffff810= 13daa>] ? child_rip+0xa/0x20
 [<ffffffff8106fc45&= gt;] ? __call_usermodehelper+0x0/0x6f
 [<ffffffff810= 12f91>] ? int_ret_from_sys_call+0x7/0x1b
 [<fffff= fff8101371d>] ? retint_restore_args+0x5/0x6
 [<ff= ffffff81013da0>] ? c
hild_rip+0x0/0x20
Code: 41 5e 41 5f c9&nb= sp;c3 55 48 89 e5 0f 1f 44 00&nbs= p;00 e8 17 ff ff ff c9 c3 55 = ;48 89 e5 0f 1f 44 00 00 65 = 8b 04 25 c8 55 01 00 ff c8 7= 5 04 <0f> 0b eb fe 65 48 8b=  34 25 c0 55 01 00 48 81 c6&= nbsp;b8 02 00 00 e8 
RIP  [<ffff= ffff8103a3cb>] leave_mm+0x15/0x46
 RSP <ffff88002= 803ee48>
---[ end trace 1522f17fdfc9162d ]---Kernel panic - not syncing: Fatal  exception in interrupt
Pid: 8022, comm: khel= per Tainted: G      D  =   2.6.32.36xen #1
Call Trace:
 <IRQ>=   [<ffffffff8105682e>] panic+0xe0/0x19a
 [&l= t;ffffffff8144006a>] ? init_amd+0x296/0x37a
 [<ff= ffffff8100f169>] ? xen_force_evtchn_callback+0xd/0xf
&nbs= p;[<ffffffff8100f8c2>] ? check_events+0x12/0x20
 = [<ffffffff8100f8af>] ? xen_restore_fl_direct_end+0x0/0x1<= BR> [<ffffffff81056487>] ? print_oops_end_marker+0x2= 3/0x25
 [<ffffffff81448165>] oops_end+0xb6/0xc6
&nb= sp;[<ffffffff810166e5>] die+0x5a/0x63
 [<ffffffff81= 447a3c>] do_trap+0x115/0x124
 [<ffffffff810148e6>]&= nbsp;do_invalid_op+0x9c/0xa5
 [<ffffffff8103a3cb>] ?&n= bsp;leave_mm+0x15/0x46
 [<fffff fff8100f6e6>] ? xen_clocksource_read+0x21/0x23
 [&l= t;ffffffff8100f258>] ? HYPERVISOR_vcpu_op+0xf/0x11
 = [<ffffffff8100f753>] ? xen_vcpuop_set_next_event+0x52/0x6= 7
 [<ffffffff81013b3b>] invalid_op+0x1b/0x20
 = [<ffffffff81447292>] ? _spin_unlock_irqrestore+0x15/0x17<= BR> [<ffffffff8103a3cb>] ? leave_mm+0x15/0x46
&nb= sp;[<ffffffff8100e4a4>] drop_other_mm_ref+0x2a/0x53
 [= <ffffffff81087224>] generic_smp_call_function_single_interrupt= +0xd8/0xfc
 [<ffffffff810100e8>] xen_call_function_sin= gle_interrupt+0x13/0x28
 [<ffffffff810a936a>] handle_I= RQ_event+0x66/0x120
 [<ffffffff810aac5b>] handle_percp= u_irq+0x41/0x6e
 [<ffffffff8128c1a8>] __xen_evtchn_do_= upcall+0x1ab/0x27d
 [<ffffffff8128dcf9>] xen_evtchn_do= _upcall+0x33/0x46
 [<ffffffff81 013efe>] xen_do_hypervisor_callback+0x1e/0x30
 <EOI&g= t;  [<ffffffff81447292>] ? _spin_unlock_irqrest= ore+0x15/0x17
 [<ffffffff8100f8af>] ? xen_restore= _fl_direct_end+0x0/0x1
 [<ffffffff81113f75>] ? fl= ush_old_exec+0x3ac/0x500
 [<ffffffff81150dc9>] ? = load_elf_binary+0x0/0x17ef
 [<ffffffff81150dc9>] ?&nbs= p;load_elf_binary+0x0/0x17ef
 [<ffffffff81151161>] ?&n= bsp;load_elf_binary+0x398/0x17ef
 [<ffffffff81042fcf>] = ;? need_resched+0x23/0x
2d
 [<ffffffff811f463c>]&nb= sp;? process_measurement+0xc0/0xd7
 [<ffffffff81150dc9>= ;] ? load_elf_binary+0x0/0x17ef
 [<ffffffff81113098&= gt;] ? search_binary_handler+0xc8/0x255
 [<ffffffff8= 1114366>] ? do_execve+0x1c3/0x29e
 [<ffffffff8101= 155d>] ? sys_execve+0x43/0x5d
 [<ffffffff8106fc45>] ? __call_usermodehelper+0= x0/0x6f
 [<ffffffff81013e28>] ? kernel_execve+0x6= 8/0xd0
 [<ffffffff8106fc45>] ? __call_usermodehel= per+0x0/0x6f
 [<ffffffff8100f8af>] ? xen_restore_= fl_direct_end+0x0/0x1
 [<ffffffff8106fb64>] ? ___= _call_usermodehelper+0x113/0x11e
 [<ffffffff81013daa>] = ;? child_rip+0xa/0x20
 [<ffffffff8106fc45>] ?&nbs= p;__call_usermodehelper+0x0/0x6f
 [<ffffffff81012f91>] = ;? int_ret_from_sys_call+0x7/0x1b
 [<ffffffff8101371d>= ] ? retint_restore_args+0x5/0x6
 [<ffffffff81013da0&= gt;] ? child_rip+0x0/0x20
(XEN) Domain 0 cras= hed: 'noreboot' set - not rebooting.

 
> Date: Tue, 12 Apr 2011 06:00:00 -0400
> From: konrad.wilk@orac= le.com
> To: tinnycloud@hotmail.com
> CC: xen-devel@lists.xen= source.com; giamteckchoon@gmail.com; jeremy@goop.org
> Subject: Re:= Kernel BUG at arch/x86/mm/tlb.c:61
>
> On Tue, Apr 12, 2011= at 05:11:51PM +0800, MaoXiaoyun wrote:
> >
> > Hi :> >
> > We are using pvops kernel 2.6.32.36 + xen 4.0.1= , but have run into a kernel panic bug.
> >
> > 2.6.32.36 K= ernel: http://git.kernel.org/?p=3Dlinux/kernel/git/jeremy/xen.git;a=3Dcom= mit;h=3Dbb1a15e55ec665a64c8a9c6bd699b1f16ac01ff4
> > Xen 4.0.1 h= ttp://xenbits.xen.org/hg/xen-4.0-testing.hg/rev/b536ebfba183
> >= ;
> > Our test is simple: 24 HVMs (Win2003) on a single host, e= ach HVM loops through a restart every 15 minutes.
>
> What is the s= torage that you are using for your guests? AoE? Local disks?
>
= > > About 17 machines are involved in the test; after a 10-hour run, one encountered a crash at arch/x86/mm/tlb.c:= 61
> >
> > Currently I am trying "cpuidle=3D0 cpufreq=3D= none" tests based on Teck's suggestion.
> >
> > Any co= mments, thanks.
> >
> > =3D=3D=3D=3D=3D=3D=3D=3D=3D=3D= =3D=3D=3D=3D=3Dcrash log=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D=3D= =3D=3D=3D=3D=3D=3D=3D=3D=3D
> > INIT: Id "s0" respawning too fas= t: disabled for 5 minutes
> > __ratelimit: 14 callbacks suppress= ed
> > blktap_sysfs_destroy
> > blktap_sysfs_destroy> > ------------[ cut here ]------------
> > kernel BUG a= t arch/x86/mm/tlb.c:61!
> > invalid opcode: 0000 [#1] SMP
&g= t; > last sysfs file: /sys/devices/system/xen_memory/xen_memory0/info/= current_kb
> > CPU 1
> > Modules linked in: 8021q garp= xen_netback xen_blkback blktap blkback_pagemap nbd bridge stp llc autofs= 4 ipmi_devintf ipmi_si ipmi_msghandler lockd sunrpc bonding ipv6 xenfs dm= _multipath video output sbs sbshc parport_pc lp pa rport ses enclosure snd_seq_dummy snd_seq_oss snd_seq_midi_event snd_seq= snd_seq_device serio_raw bnx2 snd_pcm_oss snd_mixer_oss snd_pcm snd_time= r iTCO_wdt snd soundcore snd_page_alloc i2c_i801 iTCO_vendor_support i2c_= core pcspkr pata_acpi ata_generic ata_piix shpchp mptsas mptscsih mptbase= [last unloaded: freq_table]
> > Pid: 25581, comm: khelper Not t= ainted 2.6.32.36fixxen #1 Tecal RH2285
> > RIP: e030:[<fffff= fff8103a3cb>] [<ffffffff8103a3cb>] leave_mm+0x15/0x46
> &g= t; RSP: e02b:ffff88002805be48 EFLAGS: 00010046
> > RAX: 00000000= 00000000 RBX: 0000000000000001 RCX: ffff88015f8e2da0
> > RDX: ff= ff88002805be78 RSI: 0000000000000000 RDI: 0000000000000001
> > R= BP: ffff88002805be48 R08: ffff88009d662000 R09: dead000000200200
> = > R10: dead000000100100 R11: ffffffff814472b2 R12: ffff88009bfc1880> > R13: ffff880028063020 R14: 00000000000004f6 R15: 0000000000000= 000
> > FS: 00007f62362d66e0(0000 ) GS:ffff880028058000(0000) knlGS:0000000000000000
> > CS: e033= DS: 0000 ES: 0000 CR0: 000000008005003b
> > CR2: 0000003aabc119= 09 CR3: 000000009b8ca000 CR4: 0000000000002660
> > DR0: 00000000= 00000000 DR1: 0000000000000000 DR2: 0000000000000000
> > DR3: 00= 00000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
> > P= rocess khelper (pid: 25581, threadinfo ffff88007691e000, task ffff88009b9= 2db40)
> > Stack:
> > ffff88002805be68 ffffffff8100e4ae= 0000000000000001 ffff88009d733b88
> > <0> ffff88002805be9= 8 ffffffff81087224 ffff88002805be78 ffff88002805be78
> > <0&g= t; ffff88015f808360 00000000000004f6 ffff88002805bea8 ffffffff81010108> > Call Trace:
> > <IRQ>
> > [<ffffff= ff8100e4ae>] drop_other_mm_ref+0x2a/0x53
> > [<ffffffff810= 87224>] generic_smp_call_function_single_interrupt+0xd8/0xfc
> &= gt; [<ffffffff81010108>] xen_call_fu nction_single_interrupt+0x13/0x28
> > [<ffffffff810a936a>= ] handle_IRQ_event+0x66/0x120
> > [<ffffffff810aac5b>] han= dle_percpu_irq+0x41/0x6e
> > [<ffffffff8128c1c0>] __xen_ev= tchn_do_upcall+0x1ab/0x27d
> > [<ffffffff8128dd11>] xen_ev= tchn_do_upcall+0x33/0x46
> > [<ffffffff81013efe>] xen_do_h= ypervisor_callback+0x1e/0x30
> > <EOI>
> > [<= ffffffff814472b2>] ? _spin_unlock_irqrestore+0x15/0x17
> > [&= lt;ffffffff8100f8cf>] ? xen_restore_fl_direct_end+0x0/0x1
> >= [<ffffffff81113f71>] ? flush_old_exec+0x3ac/0x500
> > [&l= t;ffffffff81150dc5>] ? load_elf_binary+0x0/0x17ef
> > [<ff= ffffff81150dc5>] ? load_elf_binary+0x0/0x17ef
> > [<ffffff= ff8115115d>] ? load_elf_binary+0x398/0x17ef
> > [<ffffffff= 81042fcf>] ? need_resched+0x23/0x2d
> > [<ffffffff811f4648= >] ? process_measurement+0xc0/0xd7
& gt; > [<ffffffff81150dc5>] ? load_elf_binary+0x0/0x17ef
>= > [<ffffffff81113094>] ? search_binary_handler+0xc8/0x255
&g= t; > [<ffffffff81114362>] ? do_execve+0x1c3/0x29e
> > [= <ffffffff8101155d>] ? sys_execve+0x43/0x5d
> > [<ffffff= ff8106fc45>] ? __call_usermodehelper+0x0/0x6f
> > [<ffffff= ff81013e28>] ? kernel_execve+0x68/0xd0
> > [<ffffffff8106f= c45>] ? __call_usermodehelper+0x0/0x6f
> > [<ffffffff8100f= 8cf>] ? xen_restore_fl_direct_end+0x0/0x1
> > [<ffffffff81= 06fb64>] ? ____call_usermodehelper+0x113/0x11e
> > [<fffff= fff81013daa>] ? child_rip+0xa/0x20
> > [<ffffffff8106fc45&= gt;] ? __call_usermodehelper+0x0/0x6f
> > [<ffffffff81012f91&= gt;] ? int_ret_from_sys_call+0x7/0x1b
> > [<ffffffff8101371d&= gt;] ? retint_restore_args+0x5/0x6
> > [<ffffffff81013da0>= ] ? child_rip+0x0/0x20
> > Code:=20 41 5e 41 5f c9 c3 55 48 89 e5 0f 1f 44 00 00 e8 17 ff ff ff c9 c3 55 48 = 89 e5 0f 1f 44 00 00 65 8b 04 25 c8 55 01 00 ff c8 75 04 <0f> 0b eb= fe 65 48 8b 34 25 c0 55 01 00 48 81 c6 b8 02 00 00 e8
> > RIP = [<ffffffff8103a3cb>] leave_mm+0x15/0x46
> > RSP <ffff88= 002805be48>
> > ---[ end trace ce9cee6832a9c503 ]---
> = > Kernel panic - not syncing: Fatal exception in interrupt
> >= ; Pid: 25581, comm: khelper Tainted: G D 2.6.32.36fixxen #1
> > = Call Trace:
> > <IRQ> [<ffffffff8105682e>] panic+0xe= 0/0x19a
> > [<ffffffff8144008a>] ? init_amd+0x296/0x37a> > [<ffffffff8100f17d>] ? xen_force_evtchn_callback+0xd/0xf=
> > [<ffffffff8100f8e2>] ? check_events+0x12/0x20
>= > [<ffffffff8100f8cf>] ? xen_restore_fl_direct_end+0x0/0x1
&= gt; > [<ffffffff81056487>] ? print_oops_end_marker+0x23/0x25
= > > [<ffffffff81448185>] oops_ end+0xb6/0xc6
> > [<ffffffff810166e5>] die+0x5a/0x63
&= gt; > [<ffffffff81447a5c>] do_trap+0x115/0x124
> > [<= ;ffffffff810148e6>] do_invalid_op+0x9c/0xa5
> > [<ffffffff= 8103a3cb>] ? leave_mm+0x15/0x46
> > [<ffffffff8100f6fa>= ] ? xen_clocksource_read+0x21/0x23
> > [<ffffffff8100f26c>= ] ? HYPERVISOR_vcpu_op+0xf/0x11
> > [<ffffffff8100f767>] ?= xen_vcpuop_set_next_event+0x52/0x67
> > [<ffffffff81080bfa&g= t;] ? clockevents_program_event+0x78/0x81
> > [<ffffffff81013= b3b>] invalid_op+0x1b/0x20
> > [<ffffffff814472b2>] ? _= spin_unlock_irqrestore+0x15/0x17
> > [<ffffffff8103a3cb>] = ? leave_mm+0x15/0x46
> > [<ffffffff8100e4ae>] drop_other_m= m_ref+0x2a/0x53
> > [<ffffffff81087224>] generic_smp_call_= function_single_interrupt+0xd8/0xfc
> > [<ffffffff81010108>= ;] xen_call_function_single_interrupt+0x13 /0x28
> > [<ffffffff810a936a>] handle_IRQ_event+0x66/0x12= 0
> > [<ffffffff810aac5b>] handle_percpu_irq+0x41/0x6e
= > > [<ffffffff8128c1c0>] __xen_evtchn_do_upcall+0x1ab/0x27d> > [<ffffffff8128dd11>] xen_evtchn_do_upcall+0x33/0x46
= > > [<ffffffff81013efe>] xen_do_hypervisor_callback+0x1e/0x30=
> > <EOI> [<ffffffff814472b2>] ? _spin_unlock_irqre= store+0x15/0x17
> > [<ffffffff8100f8cf>] ? xen_restore_fl_= direct_end+0x0/0x1
> > [<ffffffff81113f71>] ? flush_old_ex= ec+0x3ac/0x500
> > [<ffffffff81150dc5>] ? load_elf_binary+= 0x0/0x17ef
> > [<ffffffff81150dc5>] ? load_elf_binary+0x0/= 0x17ef
> > [<ffffffff8115115d>] ? load_elf_binary+0x398/0x= 17ef
> > [<ffffffff81042fcf>] ? need_resched+0x23/0x2d
= > > [<ffffffff811f4648>] ? process_measurement+0xc0/0xd7
&= gt; > [<ffffffff81150dc5>] ? load _elf_binary+0x0/0x17ef
> > [<ffffffff81113094>] ? search_= binary_handler+0xc8/0x255
> > [<ffffffff81114362>] ? do_ex= ecve+0x1c3/0x29e
> > [<ffffffff8101155d>] ? sys_execve+0x4= 3/0x5d
> > [<ffffffff8106fc45>] ? __call_usermodehelper+0x= 0/0x6f
> > [<ffffffff81013e28>] ? kernel_execve+0x68/0xd0<= BR>> > [<ffffffff8106fc45>] ? __call_usermodehelper+0x0/0x6f<= BR>> > [<ffffffff8100f8cf>] ? xen_restore_fl_direct_end+0x0/0= x1
> > [<ffffffff8106fb64>] ? ____call_usermodehelper+0x11= 3/0x11e
> > [<ffffffff81013daa>] ? child_rip+0xa/0x20
&= gt; > [<ffffffff8106fc45>] ? __call_usermodehelper+0x0/0x6f
&= gt; > [<ffffffff81012f91>] ? int_ret_from_sys_call+0x7/0x1b
&= gt; > [<ffffffff8101371d>] ? retint_restore_args+0x5/0x6
>= > [<ffffffff81013da0>] ? child_rip+0x0/0x20
> >
&g= t; >
--_702121fa-b4c8-4aa3-b55a-69720ad5fc06_-- --===============0760198219== Content-Type: text/plain; charset="us-ascii" MIME-Version: 1.0 Content-Transfer-Encoding: 7bit Content-Disposition: inline _______________________________________________ Xen-devel mailing list Xen-devel@lists.xensource.com http://lists.xensource.com/xen-devel --===============0760198219==--