<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:07:33 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-489] Hyperion-mds1 - swraid crash in mkfs.lustre</title>
                <link>https://jira.whamcloud.com/browse/LU-489</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Ran command:&lt;br/&gt;
#mkfs.lustre --reformat --mgs --mdt --fsname lustre /dev/md0&lt;/p&gt;

&lt;p&gt;Result:&lt;br/&gt;
---------------&lt;/p&gt;

&lt;p&gt;2011-07-05 16:25:34 hyperion-mds1 login: ----------- &lt;span class=&quot;error&quot;&gt;&amp;#91;cut here &amp;#93;&lt;/span&gt; --------- &lt;span class=&quot;error&quot;&gt;&amp;#91;please bite here &amp;#93;&lt;/span&gt; ---------&lt;br/&gt;
2011-07-05 16:26:50 Kernel BUG at fs/bio.c:222&lt;br/&gt;
2011-07-05 16:26:50 invalid opcode: 0000 &lt;span class=&quot;error&quot;&gt;&amp;#91;1&amp;#93;&lt;/span&gt; SMP &lt;br/&gt;
2011-07-05 16:26:50 last sysfs file: /devices/pci0000:00/0000:00:0d.0/0000:05:00.0/0000:06:03.1/irq&lt;br/&gt;
2011-07-05 16:26:50 CPU 11 &lt;br/&gt;
2011-07-05 16:26:50 Modules linked in: ext4(U) ldiskfs(U) jbd2(U) crc16(U) lustre(U) lov(U) mdc(U) lquota(U) osc(U) ptlrpc(U) obdclass(U) lvfs(U) ko2iblnd(U) lnet(U) libcfs(U) ib_srp(U) ib_ipoib(U) rdma_ucm(U) rdma_cm(U) iw_cm(U) ib_addr(U) ib_ucm(U) ib_uverbs(U) ib_umad(U) mlx4_ib(U) mlx4_core(U) ipoib_helper(U) ib_cm(U) ib_sa(U) ib_mad(U) ib_core(U) ipv6(U) xfrm_nalgo(U) crypto_api(U) dm_mirror(U) dm_log(U) dm_multipath(U) scsi_dh(U) dm_mod(U) raid10(U) video(U) backlight(U) sbs(U) power_meter(U) i2c_ec(U) dell_wmi(U) wmi(U) button(U) battery(U) asus_acpi(U) acpi_memhotplug(U) ac(U) parport_pc(U) lp(U) parport(U) sd_mod(U) sg(U) floppy(U) mptsas(U) mptscsih(U) sata_nv(U) mptbase(U) i2c_nforce2(U) pcspkr(U) libata(U) ohci_hcd(U) i2c_core(U) k10temp(U) scsi_transport_sas(U) amd64_edac_mod(U) hwmon(U) tpm_tis(U) scsi_mod(U) edac_mc(U) shpchp(U) tpm(U) tpm_bios(U) serio_raw(U) ide_cd(U) cdrom(U) nfs(U) nfs_acl(U) lockd(U) fscache(U) sunrpc(U) e1000(U)&lt;br/&gt;
2011-07-05 16:26:50 Pid: 36, comm: ksoftirqd/11 Tainted: G      2.6.18-238.12.1.el5_lustre.g266a955 #1&lt;br/&gt;
2011-07-05 16:26:50 RIP: 0010:&lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8002e266&amp;gt;&amp;#93;&lt;/span&gt;  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8002e266&amp;gt;&amp;#93;&lt;/span&gt; bio_put+0xa/0x32&lt;br/&gt;
2011-07-05 16:26:50 RSP: 0000:ffff810138df3db0  EFLAGS: 00010246&lt;br/&gt;
2011-07-05 16:26:50 RAX: 0000000000000000 RBX: ffff811032cb7d80 RCX: ffff813770b8bec0&lt;br/&gt;
2011-07-05 16:26:50 RDX: ffff8124f07f7d40 RSI: ffff810f6dab3b40 RDI: ffff8124f07f7d40&lt;br/&gt;
2011-07-05 16:26:50 RBP: ffff813770b8bf18 R08: 0000000000001000 R09: ffff811032cb7e10&lt;br/&gt;
2011-07-05 16:26:50 R10: ffff81206d101d88 R11: ffffffff800452a8 R12: ffff813770b8bec0&lt;br/&gt;
2011-07-05 16:26:50 R13: 0000000000000001 R14: 0000000000001000 R15: 00000000000c3000&lt;br/&gt;
2011-07-05 16:26:50 FS:  00002aaaabc8fb50(0000) GS:ffff8120381ab2c0(0000) knlGS:0000000000000000&lt;br/&gt;
2011-07-05 16:26:50 CS:  0010 DS: 0018 ES: 0018 CR0: 000000008005003b&lt;br/&gt;
2011-07-05 16:26:50 CR2: 00002aaaaace2b80 CR3: 0000002036af0000 CR4: 00000000000006e0&lt;br/&gt;
2011-07-05 16:26:50 Process ksoftirqd/11 (pid: 36, threadinfo ffff8120381c6000, task ffff81103819c040)&lt;br/&gt;
2011-07-05 16:26:50 Stack:  ffffffff88383abc 0000000000000002 ffff813770b8bec0 0000000000000002&lt;br/&gt;
2011-07-05 16:26:50  ffff811032cb7d80 0000000013730d08 ffffffff883857bb ffff8125a30636c0&lt;br/&gt;
2011-07-05 16:26:50  ffff811037f2edc0 ffff8124507f7d40 ffff8110334066b0 ffff8130326104e8&lt;br/&gt;
2011-07-05 16:26:50 Call Trace:&lt;br/&gt;
2011-07-05 16:26:50  &amp;lt;IRQ&amp;gt;  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88383abc&amp;gt;&amp;#93;&lt;/span&gt; :raid10:raid_end_bio_io+0x59/0x80&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff883857bb&amp;gt;&amp;#93;&lt;/span&gt; :raid10:raid10_end_write_request+0xe6/0x126&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8002cecb&amp;gt;&amp;#93;&lt;/span&gt; __end_that_request_first+0x23c/0x5bf&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8005c444&amp;gt;&amp;#93;&lt;/span&gt; blk_run_queue+0x41/0x72&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff881491f2&amp;gt;&amp;#93;&lt;/span&gt; :scsi_mod:scsi_end_request+0x27/0xcd&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff881493e6&amp;gt;&amp;#93;&lt;/span&gt; :scsi_mod:scsi_io_completion+0x14e/0x324&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff882b10f0&amp;gt;&amp;#93;&lt;/span&gt; :sd_mod:sd_rw_intr+0x25a/0x294&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8814967b&amp;gt;&amp;#93;&lt;/span&gt; :scsi_mod:scsi_device_unbusy+0x67/0x81&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff80037fa0&amp;gt;&amp;#93;&lt;/span&gt; blk_done_softirq+0x5f/0x6d&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff80012515&amp;gt;&amp;#93;&lt;/span&gt; __do_softirq+0x89/0x133&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8005e2fc&amp;gt;&amp;#93;&lt;/span&gt; call_softirq+0x1c/0x28&lt;br/&gt;
2011-07-05 16:26:50  &amp;lt;EOI&amp;gt;  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff800963b1&amp;gt;&amp;#93;&lt;/span&gt; ksoftirqd+0x0/0xbf&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8006d5f5&amp;gt;&amp;#93;&lt;/span&gt; do_softirq+0x2c/0x7d&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff80096410&amp;gt;&amp;#93;&lt;/span&gt; ksoftirqd+0x5f/0xbf&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff80032b1e&amp;gt;&amp;#93;&lt;/span&gt; kthread+0xfe/0x132&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8005dfb1&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x11&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff80032a20&amp;gt;&amp;#93;&lt;/span&gt; kthread+0x0/0x132&lt;br/&gt;
2011-07-05 16:26:50  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8005dfa7&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0x0/0x11&lt;br/&gt;
2011-07-05 16:26:50 &lt;br/&gt;
2011-07-05 16:26:50 &lt;br/&gt;
2011-07-05 16:26:50 Code: 0f 0b 68 24 a9 2b 80 c2 de 00 f0 ff 4a 50 0f 94 c0 84 c0 74 &lt;br/&gt;
2011-07-05 16:26:50 RIP  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8002e266&amp;gt;&amp;#93;&lt;/span&gt; bio_put+0xa/0x32&lt;br/&gt;
2011-07-05 16:26:50  RSP &amp;lt;ffff810138df3db0&amp;gt;&lt;br/&gt;
2011-07-05 16:26:50 REWRITING MCP55 CFG REG&lt;br/&gt;
2011-07-05 16:26:50 CFG = c1&lt;br/&gt;
2011-07-05 16:26:50 Linux version 2.6.18-238.12.1.el5_lustre.g266a955 (jenkins@rhel5-64-build.lab.whamcloud.com) (gcc version 4.1.2 20080704 (Red Hat 4.1.2-50)) #1 SMP Fri Jun 10 16:39:27 PDT 2011&lt;/p&gt;


&lt;p&gt;Has occurred now 6 times, easy to reproduce. &lt;/p&gt;</description>
                <environment>Hyperion chaos distribute Linux version 2.6.18-238.12.1.el5_lustre.g266a955 (&lt;a href=&apos;mailto:jenkins@rhel5-64-build.lab.whamcloud.com&apos;&gt;jenkins@rhel5-64-build.lab.whamcloud.com&lt;/a&gt;) (gcc version 4.1.2 20080704 (Red Hat 4.1.2-50)) #1 SMP Fri Jun 10 16:39:27 PDT 2011                </environment>
        <key id="11283">LU-489</key>
            <summary>Hyperion-mds1 - swraid crash in mkfs.lustre</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="ys">Yang Sheng</assignee>
                                    <reporter username="cliffw">Cliff White</reporter>
                        <labels>
                    </labels>
                <created>Tue, 5 Jul 2011 19:45:58 +0000</created>
                <updated>Wed, 1 Jul 2015 16:15:43 +0000</updated>
                            <resolved>Wed, 1 Jul 2015 16:15:43 +0000</resolved>
                                    <version>Lustre 1.8.6</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="17270" author="cliffw" created="Tue, 5 Jul 2011 21:08:59 +0000"  >&lt;p&gt;Also worth noting - the MDS is the only node using the mptbase and mptsas drivers. - The OSSs are HW (DDN) and &lt;br/&gt;
do not have those cards.&lt;/p&gt;</comment>
                            <comment id="17271" author="cliffw" created="Tue, 5 Jul 2011 22:47:09 +0000"  >&lt;p&gt;I built a new image, based on chaos 4.4-2 - Installed the same RPMS, had the same crash. I repeated the test with the image from last week, &lt;br/&gt;
with kernel vmlinuz-2.6.18-238.12.1.el5_lustre.g266a955, and the crash did not repeat.&lt;/p&gt;</comment>
                            <comment id="17272" author="cliffw" created="Tue, 5 Jul 2011 22:53:52 +0000"  >&lt;p&gt;sorry, pasted wrong version - the non-crashing kernel is vmlinuz-2.6.18-238.12.1.el5_lustre.g529529a&lt;/p&gt;</comment>
                            <comment id="17327" author="pjones" created="Wed, 6 Jul 2011 17:45:47 +0000"  >&lt;p&gt;Yang Sheng&lt;/p&gt;

&lt;p&gt;Do you see anything in the raid patches in our patch series for the latest rhel kernel that might explain this?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="17361" author="johann" created="Thu, 7 Jul 2011 05:57:53 +0000"  >&lt;p&gt;All those kernels should be the same. The version string has changed just because i enabled/disabled slab debugging.&lt;br/&gt;
Yangsheng, do we patch some common code which could be used by RAID10 too?&lt;br/&gt;
Cliff, any chance to try with a stock Redhat kernel?&lt;/p&gt;</comment>
                            <comment id="17374" author="ys" created="Thu, 7 Jul 2011 09:57:45 +0000"  >&lt;p&gt;I cannot be sure whether our patches cause this kind of issue. But I think we can test without our raid patches to ensure they aren&apos;t crashing the kernel. &lt;/p&gt;</comment>
                            <comment id="17385" author="cliffw" created="Thu, 7 Jul 2011 13:47:19 +0000"  >&lt;p&gt;I don&apos;t know what I would test with a stock kernel - the issue is a failure triggered by running mkfs.lustre, and I cannot do this with a stock kernel. mkfs -t ext3 and mkfs -t ext4 have been tested on all these kernels, and do not fail. Please explain what tests you wish to run with a stock kernel, and I&apos;ll see about finding the bits. &lt;/p&gt;</comment>
                            <comment id="17389" author="johann" created="Thu, 7 Jul 2011 16:41:11 +0000"  >&lt;p&gt;Have you tried with a simple dd? In any case, mkfs.lustre does not require loading the kernel module, so you should be able to run it on an unpatched kernel.&lt;/p&gt;</comment>
                            <comment id="120058" author="ys" created="Wed, 1 Jul 2015 16:13:00 +0000"  >&lt;p&gt;Can we close this one? Looks like it just hit on rhel5 kernel.&lt;/p&gt;</comment>
                            <comment id="120059" author="cliffw" created="Wed, 1 Jul 2015 16:15:43 +0000"  >&lt;p&gt;Might as well close, we haven&apos;t hit it again&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzw387:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>10607</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10023"><![CDATA[4]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>