<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:14:46 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1232] Input/Output error during large lun test</title>
                <link>https://jira.whamcloud.com/browse/LU-1232</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Running large lun with 24T OST on Juelich cluster, got this error when running llverfs in full mode on the OST ldiskfs filesystem &lt;/p&gt;

&lt;p&gt;write filename: /mnt/ost1/dir00157/file025, current 787.039 MB/s, overall 100.624 MB/s, est 4294967248:4294967257:4294967237 left&lt;br/&gt;
write filename: /mnt/ost1/dir00157/file026, current 794.458 MB/s, overall 100.642 MB/s, est 4294967248:4294967252:429496724&lt;br/&gt;
llverfs: Open &apos;/mnt/ost1/dir00172/file002&apos; failed:Input/output error&lt;/p&gt;


&lt;p&gt;Please see the attached for console log and dmesg.&lt;/p&gt;</description>
                <environment>2.2-RC1-RHEL6 server and client</environment>
        <key id="13608">LU-1232</key>
            <summary>Input/Output error during large lun test</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="2">Won&apos;t Fix</resolution>
                                        <assignee username="ys">Yang Sheng</assignee>
                                    <reporter username="sarah">Sarah Liu</reporter>
                        <labels>
                    </labels>
                <created>Mon, 19 Mar 2012 02:26:55 +0000</created>
                <updated>Wed, 21 Mar 2012 12:53:58 +0000</updated>
                            <resolved>Wed, 21 Mar 2012 10:17:36 +0000</resolved>
                                    <version>Lustre 2.2.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                            <comments>
                            <comment id="31510" author="pjones" created="Mon, 19 Mar 2012 16:48:46 +0000"  >&lt;p&gt;Yangsheng&lt;/p&gt;


&lt;p&gt;Could you please advise on this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="31571" author="ys" created="Tue, 20 Mar 2012 06:56:49 +0000"  >&lt;p&gt;This issue looks like it is caused by a hardware problem.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;sd 6:0:27:0: rejecting I/O to offline device
LDISKFS-fs error (device dm-1): ldiskfs_find_entry: reading directory #22708225 offset 0
sd 6:0:27:0: rejecting I/O to offline device
LDISKFS-fs error (device dm-1): ldiskfs_read_inode_bitmap: Cannot read inode bitmap - block_group = 177408, inode_bitmap = 5813305600
LDISKFS-fs error (device dm-1) in ldiskfs_new_inode: IO failure
sd 6:0:27:0: rejecting I/O to offline device
LDISKFS-fs (dm-1): delayed block allocation failed for inode 22544416 at logical offset 995328 with max blocks 2048 with error -5

This should not happen!!  Data will be lost
JBD2: Detected IO errors while flushing file data on dm-1-8
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="31597" author="sarah" created="Tue, 20 Mar 2012 12:47:35 +0000"  >&lt;p&gt;I reran this test in partial mode, and it failed again. Please see the attached files for the console log and dmesg.&lt;/p&gt;
                            <comment id="31602" author="ys" created="Tue, 20 Mar 2012 13:37:41 +0000"  >&lt;p&gt;From dmesg_partial, it is very obviously a storage error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Buffer I/O error on device dm-0, logical block 65598925
lost page write due to I/O error on dm-0
sd 6:0:22:0: [sdu] Unhandled error code
sd 6:0:22:0: [sdu] Result: hostbyte=DID_NO_CONNECT driverbyte=DRIVER_OK
sd 6:0:22:0: [sdu] CDB: Write(10): 2a 00 1f 61 89 08 00 00 08 00
end_request: I/O error, dev sdu, sector 526485768
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I&apos;ll look into the RHEL6 bugzilla to try to find out whether this kind of issue has been reported with this driver.&lt;/p&gt;

&lt;p&gt;mpt2sas0: LSISAS2008: FWVersion(11.00.00.00), ChipRevision(0x03), BiosVersion(07.21.00.00)&lt;/p&gt;

&lt;p&gt;Thanks for the whole dmesg log.&lt;/p&gt;</comment>
                            <comment id="31620" author="sarah" created="Tue, 20 Mar 2012 19:35:37 +0000"  >&lt;p&gt;I tried to install the tag-2.1.56 build again and got the following error:&lt;br/&gt;
-------------------&lt;br/&gt;
BUG: unable to handle kernel NULL pointer dereference at 0000000000000006&lt;br/&gt;
IP: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00b9f01&amp;gt;&amp;#93;&lt;/span&gt; ses_intf_add+0x2f1/0x5e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ses&amp;#93;&lt;/span&gt;&lt;br/&gt;
PGD 630ec3067 PUD 631ed5067 PMD 0 &lt;br/&gt;
Oops: 0000 [#1] SMP &lt;br/&gt;
last sysfs file: /sys/devices/pci0000:00/0000:00:01.0/0000:01:00.1/device&lt;br/&gt;
CPU 0 &lt;br/&gt;
Modules linked in: ses(+) enclosure mlx4_ib ib_mad ib_core mlx4_en mlx4_core scsi_wait_scan(+) igb iTCO_wdt i2c_i801(+) i2c_core i7core_edac(+) ioatdma(+) iTCO_vendor_support dca edac_core microcode serio_raw shpchp(+) ext3 jbd mbcache sd_mod crc_t10dif mpt2sas(+) scsi_transport_sas raid_class ahci dm_mirror dm_region_hash dm_log dm_mod&lt;/p&gt;

&lt;p&gt;Pid: 2080, comm: modprobe Not tainted 2.6.32-220.4.2.el6_lustre.gddd1a7c.x86_64 #1 SGI.COM C1104-2TY9/X8DTT-IBQF&lt;br/&gt;
RIP: 0010:&lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00b9f01&amp;gt;&amp;#93;&lt;/span&gt;  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00b9f01&amp;gt;&amp;#93;&lt;/span&gt; ses_intf_add+0x2f1/0x5e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ses&amp;#93;&lt;/span&gt;&lt;br/&gt;
RSP: 0018:ffff8803340bfe38  EFLAGS: 00010246&lt;br/&gt;
RAX: ffff88032db03800 RBX: ffff88032f5ae800 RCX: 0000000000000017&lt;br/&gt;
RDX: 0000000000000000 RSI: ffffffff8126cdd0 RDI: 0000000000000000&lt;br/&gt;
RBP: ffff8803340bfe98 R08: ffffffff81c00280 R09: 0000000000000000&lt;br/&gt;
R10: 0000000000000000 R11: 0000000000000000 R12: ffff880637d78920&lt;br/&gt;
R13: 0000000000000000 R14: ffff880330ec0400 R15: ffff88063006cdc0&lt;br/&gt;
FS:  00007f9665162700(0000) GS:ffff880028200000(0000) knlGS:0000000000000000&lt;br/&gt;
CS:  0010 DS: 0000 ES: 0000 CR0: 000000008005003b&lt;br/&gt;
CR2: 0000000000000006 CR3: 0000000637094000 CR4: 00000000000006f0&lt;br/&gt;
DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000&lt;br/&gt;
DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400&lt;br/&gt;
Process modprobe (pid: 2080, threadinfo ffff8803340be000, task ffff880336dd74c0)&lt;br/&gt;
Stack:&lt;br/&gt;
 ffff8803340bfe78 ffffffff814d3aef ffff880330048800 ffff88032f5aeb58&lt;br/&gt;
&amp;lt;0&amp;gt; ffff88032f5ae938 0000000000000010 0000000000000000 ffffffffa00ba460&lt;br/&gt;
&amp;lt;0&amp;gt; ffffffff81b01ee0 ffff8803340bfea8 0000000000000000 0000000000000000&lt;br/&gt;
Call Trace:&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814d3aef&amp;gt;&amp;#93;&lt;/span&gt; ? klist_next+0x7f/0xf0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81347599&amp;gt;&amp;#93;&lt;/span&gt; class_interface_register+0xa9/0xe0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00fe000&amp;gt;&amp;#93;&lt;/span&gt; ? ses_init+0x0/0x3c &lt;span class=&quot;error&quot;&gt;&amp;#91;ses&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81367366&amp;gt;&amp;#93;&lt;/span&gt; scsi_register_interface+0x16/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00fe014&amp;gt;&amp;#93;&lt;/span&gt; ses_init+0x14/0x3c &lt;span class=&quot;error&quot;&gt;&amp;#91;ses&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100204c&amp;gt;&amp;#93;&lt;/span&gt; do_one_initcall+0x3c/0x1d0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810af4e1&amp;gt;&amp;#93;&lt;/span&gt; sys_init_module+0xe1/0x250&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100b0f2&amp;gt;&amp;#93;&lt;/span&gt; system_call_fastpath+0x16/0x1b&lt;br/&gt;
Code: 29 e1 48 85 c0 75 13 eb 51 90 48 8b 3b 48 89 c6 e8 d5 f0 29 e1 48 85 c0 74 40 8b b8 84 00 00 00 85 ff 75 e6 48 8b 90 a8 00 00 00 &amp;lt;f6&amp;gt; 42 06 40 75 d9 48 89 c6 4c 89 f7 48 89 45 b0 e8 aa fa ff ff &lt;br/&gt;
RIP  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00b9f01&amp;gt;&amp;#93;&lt;/span&gt; ses_intf_add+0x2f1/0x5e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ses&amp;#93;&lt;/span&gt;&lt;br/&gt;
 RSP &amp;lt;ffff8803340bfe38&amp;gt;&lt;br/&gt;
CR2: 0000000000000006&lt;br/&gt;
---[ end trace c653e9e779d07a3e ]---&lt;br/&gt;
Kernel panic - not syncing: Fatal exception&lt;br/&gt;
Pid: 2080, comm: modprobe Tainted: G      D    ----------------   2.6.32-220.4.2.el6_lustre.gddd1a7c.x86_64 #1&lt;br/&gt;
Call Trace:&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814ec61a&amp;gt;&amp;#93;&lt;/span&gt; ? panic+0x78/0x143&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814f07a4&amp;gt;&amp;#93;&lt;/span&gt; ? oops_end+0xe4/0x100&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104234b&amp;gt;&amp;#93;&lt;/span&gt; ? no_context+0xfb/0x260&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffffff81250984&amp;gt;&amp;#93;&lt;/span&gt; ?3&amp;gt;] ? __do_page_ft+0x49/0x60&lt;br/&gt;
 [&amp;lt;f0x190&lt;br/&gt;
 [&amp;lt;ffffffge_fault+0x25/0x30&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8126cdd0&amp;gt;&amp;#93;&lt;/span&gt; ? kobject_release+0x0/0x240&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00b9f01&amp;gt;&amp;#93;&lt;/span&gt; ? ses_intf_add+0x2f1/0x5e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ses&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00b9f25&amp;gt;&amp;#93;&lt;/span&gt; ? ses_intf_add+0x315/0x5e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ses&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814d3aef&amp;gt;&amp;#93;&lt;/span&gt; ? klist_next+0x7f/0xf0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81347599&amp;gt;&amp;#93;&lt;/span&gt; ? class_interface_register+0xa9/0xe0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00fe000&amp;gt;&amp;#93;&lt;/span&gt; ? ses_init+0x0/0x3c &lt;span class=&quot;error&quot;&gt;&amp;#91;ses&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81367366&amp;gt;&amp;#93;&lt;/span&gt; ? scsi_register_interface+0x16/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00fe014&amp;gt;&amp;#93;&lt;/span&gt; ? ses_init+0x14/0x3c &lt;span class=&quot;error&quot;&gt;&amp;#91;ses&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100204c&amp;gt;&amp;#93;&lt;/span&gt; ? do_one_initcall+0x3c/0x1d0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810af4e1&amp;gt;&amp;#93;&lt;/span&gt; ? sys_init_module+0xe1/0x250&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100b0f2&amp;gt;&amp;#93;&lt;/span&gt; ? system_call_fastpath+0x16/0x1b&lt;/p&gt;</comment>
                            <comment id="31686" author="heckes" created="Wed, 21 Mar 2012 10:04:19 +0000"  >&lt;p&gt;Hi Sarah,&lt;/p&gt;

&lt;p&gt;you&apos;re right, two disks of the pool assigned to the OSS nodes are broken:&lt;/p&gt;

&lt;p&gt;ID 5000c50040cf7d9d     /dev/sdu     ST2000NM0001 (2TB disk)&lt;br/&gt;
ID 5000c50034003265     /dev/sdz     ST33000650SS (3TB disk)&lt;/p&gt;

&lt;p&gt;I removed them from the JBOD. Could you remove them from the autotest resource file, till we receive the spare parts?&lt;/p&gt;

&lt;p&gt;That is too many HW failures in 3 months for such a small environment. I&apos;ll try to get in touch with our supplier to find out whether there&apos;s a quality issue with the disks or maybe some problem with the MPT driver, disk firmware or ...&lt;br/&gt;
I&apos;m very sorry for the delay caused by these failures. &lt;/p&gt;</comment>
                            <comment id="31701" author="pjones" created="Wed, 21 Mar 2012 10:17:36 +0000"  >&lt;p&gt;Thanks Frank. I am closing this ticket because it is now clear that it is not related to a Lustre software issue.&lt;/p&gt;</comment>
                            <comment id="31761" author="sarah" created="Wed, 21 Mar 2012 12:53:58 +0000"  >&lt;p&gt;Thanks Frank, I will remove them from the script.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="10963" name="dmesg" size="491540" author="sarah" created="Mon, 19 Mar 2012 02:31:54 +0000"/>
                            <attachment id="10978" name="dmesg_partial" size="487739" author="sarah" created="Tue, 20 Mar 2012 12:47:55 +0000"/>
                            <attachment id="10964" name="large_lun.log" size="565108" author="sarah" created="Mon, 19 Mar 2012 02:31:54 +0000"/>
                            <attachment id="10979" name="large_lun_partial.log" size="224850" author="sarah" created="Tue, 20 Mar 2012 12:47:55 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvh5z:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>6430</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>