<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:10:19 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-7602] Repeated timeouts with ZFS 0.6.5.2</title>
                <link>https://jira.whamcloud.com/browse/LU-7602</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This bug was created to track activity from &lt;a href=&quot;http://review.whamcloud.com/17712&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/17712&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-7602&quot; title=&quot;Repeated timeouts with ZFS 0.6.5.2&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-7602&quot;&gt;&lt;del&gt;LU-7602&lt;/del&gt;&lt;/a&gt; zfs: reset ZFS baseline to 0.6.4.2&lt;/p&gt;

&lt;p&gt;ZFS 0.6.5.2 is known to introduce I/O problems.&lt;br/&gt;
A typical timeout is shown below; it differs slightly from the stack traces in the Gerrit ticket:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;Dec 23 11:47:33 iws2 kernel: LNet: Service thread pid 30734 was inactive &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; 200.00s. The thread might be hung, or it might only be slow and will resume later. Dumping the stack trace &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; debugging purposes:
Dec 23 11:47:33 iws2 kernel: Pid: 30734, comm: ll_ost00_000
Dec 23 11:47:33 iws2 kernel:
Dec 23 11:47:33 iws2 kernel: Call Trace:
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa06cb330&amp;gt;] ? vdev_mirror_child_done+0x0/0x30 [zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffff815395d3&amp;gt;] io_schedule+0x73/0xc0
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa05a3eaf&amp;gt;] cv_wait_common+0xaf/0x130 [spl]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffff810a1460&amp;gt;] ? autoremove_wake_function+0x0/0x40
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa05a3f48&amp;gt;] __cv_wait_io+0x18/0x20 [spl]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa070c29b&amp;gt;] zio_wait+0x10b/0x1e0 [zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa06638a9&amp;gt;] dbuf_read+0x439/0x850 [zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa066c168&amp;gt;] dmu_buf_hold+0x68/0x90 [zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa0661fa8&amp;gt;] ? dbuf_rele_and_unlock+0x268/0x390 [zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa06d5e0a&amp;gt;] zap_lockdir+0x5a/0x770 [zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa06d797a&amp;gt;] zap_lookup_norm+0x4a/0x190 [zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa06d7b53&amp;gt;] zap_lookup+0x33/0x40 [zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa067bbe6&amp;gt;] dmu_tx_hold_zap+0x146/0x210 [zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa107b3b5&amp;gt;] osd_declare_object_create+0x2d5/0x440 [osd_zfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa11bba24&amp;gt;] ofd_precreate_objects+0x4e4/0x19d0 [ofd]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa04bc6c1&amp;gt;] ? libcfs_debug_msg+0x41/0x50 [libcfs]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa11c8bdb&amp;gt;] ? ofd_grant_create+0x23b/0x3e0 [ofd]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa11ab83e&amp;gt;] ofd_create_hdl+0x56e/0x2640 [ofd]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa0bbefe0&amp;gt;] ? lustre_pack_reply_v2+0x220/0x280 [ptlrpc]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa0c294cc&amp;gt;] tgt_request_handle+0x8ec/0x1470 [ptlrpc]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa0bd0b41&amp;gt;] ptlrpc_main+0xe41/0x1910 [ptlrpc]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffffa0bcfd00&amp;gt;] ? ptlrpc_main+0x0/0x1910 [ptlrpc]
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffff810a0fce&amp;gt;] kthread+0x9e/0xc0
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffff8100c28a&amp;gt;] child_rip+0xa/0x20
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffff810a0f30&amp;gt;] ? kthread+0x0/0xc0
Dec 23 11:47:33 iws2 kernel: [&amp;lt;ffffffff8100c280&amp;gt;] ? child_rip+0x0/0x20
Dec 23 11:47:33 iws2 kernel:
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>Hyperion/SWL - </environment>
        <key id="33838">LU-7602</key>
            <summary>Repeated timeouts with ZFS 0.6.5.2</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="3">Duplicate</resolution>
                                        <assignee username="yujian">Jian Yu</assignee>
                                    <reporter username="cliffw">Cliff White</reporter>
                        <labels>
                    </labels>
                <created>Wed, 23 Dec 2015 19:54:55 +0000</created>
                <updated>Wed, 23 Dec 2015 21:30:26 +0000</updated>
                            <resolved>Wed, 23 Dec 2015 21:28:27 +0000</resolved>
                                    <version>Lustre 2.8.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="137324" author="yujian" created="Wed, 23 Dec 2015 20:36:38 +0000"  >&lt;p&gt;Hi Cliff,&lt;/p&gt;

&lt;p&gt;Patch &lt;a href=&quot;http://review.whamcloud.com/17712&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/17712&lt;/a&gt; hit a build failure on the sles11sp2 server. I created TEI-4369 to disable the build.&lt;/p&gt;

&lt;p&gt;In the meantime, since the builds on the other distros passed, could you please verify whether the timeout issue is resolved after resetting the ZFS baseline to 0.6.4.2? Thank you.&lt;/p&gt;</comment>
                            <comment id="137334" author="adilger" created="Wed, 23 Dec 2015 21:04:00 +0000"  >&lt;p&gt;Cliff, do you have the stack traces for all the threads on the OSS?  It seems this &lt;tt&gt;ll_ost00_000&lt;/tt&gt; thread is waiting for the ZFS TXG to commit, but it would be useful to know what the other threads are doing in the meantime.&lt;/p&gt;</comment>
                            <comment id="137343" author="adilger" created="Wed, 23 Dec 2015 21:28:27 +0000"  >&lt;p&gt;Closing this as a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-7404&quot; title=&quot;ZFS OSS - Numerous timeouts - SWL&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-7404&quot;&gt;&lt;del&gt;LU-7404&lt;/del&gt;&lt;/a&gt; since that already has more information in it.  The stack trace shown here is from the OSS, which is blocked on the OST object precreate.  The stack trace shown in the 17712 ticket is the timeout on the MDS caused by waiting for new OST object precreation to complete, which is only a symptom of the actual deadlock problem on the OSS.   &lt;/p&gt;</comment>
                            <comment id="137344" author="cliffw" created="Wed, 23 Dec 2015 21:30:26 +0000"  >&lt;p&gt;I dumped the stacks on iws2. It&apos;s been a while since the error; this file includes all the timeout stacks.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="33039">LU-7404</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="19998" name="iws2.stackes.txt.gz" size="139711" author="cliffw" created="Wed, 23 Dec 2015 21:30:26 +0000"/>
                            <attachment id="19997" name="lustre-log.1450900053.30734.gz" size="3417227" author="cliffw" created="Wed, 23 Dec 2015 19:54:55 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzxwpr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>