<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:11:38 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-7754] DNE3: osd-zfs gets into a livelock if transaction is too big</title>
                <link>https://jira.whamcloud.com/browse/LU-7754</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;ONLY=300k bash sanity.sh:&lt;/p&gt;

&lt;p&gt;[   89.828294] LNet: Service thread pid 4249 was inactive for 40.00s. The thread might be hung, or it might only be slow and will resume later. Dumping the stack trace for debugging purposes:&lt;br/&gt;
[   89.831356] Pid: 4249, comm: mdt01_001&lt;br/&gt;
[   89.831895] &lt;br/&gt;
[   89.831895] Call Trace:&lt;br/&gt;
[   89.832451]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810ac6de&amp;gt;&amp;#93;&lt;/span&gt; ? getrawmonotonic+0x2e/0xc0&lt;br/&gt;
[   89.833222]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810828c5&amp;gt;&amp;#93;&lt;/span&gt; __cond_resched+0x25/0x40&lt;br/&gt;
[   89.834035]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814e521a&amp;gt;&amp;#93;&lt;/span&gt; _cond_resched+0x2a/0x40&lt;br/&gt;
[   89.834810]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814e5f11&amp;gt;&amp;#93;&lt;/span&gt; mutex_lock+0x11/0x40&lt;br/&gt;
[   89.835565]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa07741b4&amp;gt;&amp;#93;&lt;/span&gt; dmu_tx_assign+0x284/0x500 &lt;span class=&quot;error&quot;&gt;&amp;#91;zfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
[   89.836410]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0a1ae32&amp;gt;&amp;#93;&lt;/span&gt; osd_trans_start+0xb2/0x410 &lt;span class=&quot;error&quot;&gt;&amp;#91;osd_zfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
[   89.837282]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa032de15&amp;gt;&amp;#93;&lt;/span&gt; top_trans_start+0x255/0x9c0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
[   89.838090]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0bb88f9&amp;gt;&amp;#93;&lt;/span&gt; lod_trans_start+0x59/0x60 &lt;span class=&quot;error&quot;&gt;&amp;#91;lod&amp;#93;&lt;/span&gt;&lt;br/&gt;
[   89.838854]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ae3cdf&amp;gt;&amp;#93;&lt;/span&gt; mdd_trans_start+0xf/0x20 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdd&amp;#93;&lt;/span&gt;&lt;br/&gt;
[   89.839594]  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0acf1a0&amp;gt;&amp;#93;&lt;/span&gt; mdd_create+0x1170/0x1c70 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdd&amp;#93;&lt;/span&gt;&lt;/p&gt;
</description>
                <environment></environment>
        <key id="34542">LU-7754</key>
            <summary>DNE3: osd-zfs gets into a livelock if transaction is too big</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="bzzz">Alex Zhuravlev</assignee>
                                    <reporter username="bzzz">Alex Zhuravlev</reporter>
                        <labels>
                            <label>dne3</label>
                            <label>zfs</label>
                    </labels>
                <created>Sun, 7 Feb 2016 14:30:44 +0000</created>
                <updated>Tue, 27 Aug 2019 17:51:50 +0000</updated>
                                            <version>Lustre 2.8.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="141486" author="gerrit" created="Sun, 7 Feb 2016 15:38:25 +0000"  >&lt;p&gt;Alex Zhuravlev (alexey.zhuravlev@intel.com) uploaded a new patch: &lt;a href=&quot;http://review.whamcloud.com/18341&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/18341&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-7754&quot; title=&quot;DNE3: osd-zfs gets into a livelock if transaction is too big&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-7754&quot;&gt;LU-7754&lt;/a&gt; osd: osd-zfs should not wait indefinitely for a TXG&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: ebef50ed6f5032697f05c4bcc20c7fb329423a17&lt;/p&gt;</comment>
                            <comment id="141492" author="adilger" created="Mon, 8 Feb 2016 08:05:09 +0000"  >&lt;p&gt;Your patch turns this from a hang into a failure. That is an improvement, but it doesn&apos;t explain why this test failed.  Do you have an unusual config (small MDT?) or is there some regression that makes the transaction too large?&lt;/p&gt;</comment>
                            <comment id="141495" author="bzzz" created="Mon, 8 Feb 2016 08:52:14 +0000"  >&lt;p&gt;sanity/300k tries to create a big striped directory:&lt;/p&gt;

&lt;p&gt;	$LFS setdirstripe -i 0 -c512 $DIR/$tdir/striped_dir&lt;/p&gt;

&lt;p&gt;With the default MDSSIZE=200000, the DMU fails to start such a big transaction.&lt;/p&gt;
</comment>
                            <comment id="141527" author="adilger" created="Mon, 8 Feb 2016 18:11:33 +0000"  >&lt;p&gt;How large is the transaction?  Do we have a larger MDS size in our testing?&lt;/p&gt;

&lt;p&gt;I guess this is because we don&apos;t run DNE + ZFS by default. &lt;/p&gt;</comment>
                            <comment id="141541" author="bzzz" created="Mon, 8 Feb 2016 19:00:38 +0000"  >&lt;p&gt;transaction calculations:&lt;br/&gt;
mem 4986830848, asize 119683940352, fsize 8506441728, usize 8497152000&lt;/p&gt;

&lt;p&gt;It seems to fail because of insufficient memory: 4986830848 (4755MB) is needed while the test system had 4GB in total.&lt;/p&gt;</comment>
                            <comment id="192560" author="adilger" created="Tue, 18 Apr 2017 18:46:15 +0000"  >&lt;p&gt;That is &lt;tt&gt;4755 MB / 512 stripes = 9 MB/stripe&lt;/tt&gt; which seems like a lot of space to reserve?  I thought we got away from O(n^2) transaction sizes for striped directories?&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                                        </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="43694">LU-9096</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="37556">LU-8267</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzy0lr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>