<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:01:01 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-13408] tgt_cancel_slc_locks()) ASSERTION( lock-&gt;l_client_cookie != 0 )</title>
                <link>https://jira.whamcloud.com/browse/LU-13408</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;An assertion is triggered, and it means the request-&amp;gt;rq_transno is 0.&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[25892.430672] LustreError: 137-5: fs0a92-OST0006_UUID: not available for connect from 172.16.0.32@o2ib (no target). If you are running an HA pair check that the target is mounted on the other server.
[25892.435324] LustreError: Skipped 74 previous similar messages
[27887.087931] LustreError: 27219:0:(tgt_main.c:354:tgt_cancel_slc_locks()) ASSERTION( lock-&amp;gt;l_client_cookie != 0 ) failed: 
[27887.090610] LustreError: 27219:0:(tgt_main.c:354:tgt_cancel_slc_locks()) LBUG
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="58592">LU-13408</key>
            <summary>tgt_cancel_slc_locks()) ASSERTION( lock-&gt;l_client_cookie != 0 )</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="laisiyao">Lai Siyao</assignee>
                                    <reporter username="laisiyao">Lai Siyao</reporter>
                        <labels>
                    </labels>
                <created>Thu, 2 Apr 2020 09:53:24 +0000</created>
                <updated>Tue, 16 Jun 2020 03:30:42 +0000</updated>
                            <resolved>Tue, 16 Jun 2020 03:30:42 +0000</resolved>
                                    <version>Lustre 2.14.0</version>
                                    <fixVersion>Lustre 2.14.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="266741" author="green" created="Thu, 2 Apr 2020 20:11:40 +0000"  >&lt;p&gt;This same failure made a noticeable appearance in current master-next, but there&apos;s nothing I am able to attribute it to yet.&lt;/p&gt;

&lt;p&gt;It always happened in sanity 300a&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[30778.381687] Lustre: DEBUG MARKER: == sanity test 300a: basic striped dir sanity test =================================================== 13:43:36 (1585763016)
[30779.451744] LustreError: 23319:0:(tgt_main.c:357:tgt_cancel_slc_locks()) ASSERTION( lock-&amp;gt;l_client_cookie != 0 ) failed: 
[30779.474964] LustreError: 23319:0:(tgt_main.c:357:tgt_cancel_slc_locks()) LBUG
[30779.477837] Pid: 23319, comm: jbd2/dm-0-8 3.10.0-7.7-debug #1 SMP Wed Oct 30 08:47:36 EDT 2019
[30779.482233] Call Trace:
[30779.483993]  [&amp;lt;ffffffffa03b3ddc&amp;gt;] libcfs_call_trace+0x8c/0xc0 [libcfs]
[30779.486127]  [&amp;lt;ffffffffa03b3e8c&amp;gt;] lbug_with_loc+0x4c/0xa0 [libcfs]
[30779.488094]  [&amp;lt;ffffffffa07eb08f&amp;gt;] tgt_cancel_slc_locks+0x1cf/0x1e0 [ptlrpc]
[30779.491227]  [&amp;lt;ffffffffa07ecdb6&amp;gt;] tgt_cb_last_committed+0x116/0x390 [ptlrpc]
[30779.496651]  [&amp;lt;ffffffffa0ce44db&amp;gt;] osd_trans_commit_cb+0xcb/0x2c0 [osd_ldiskfs]
[30779.500512]  [&amp;lt;ffffffffa0c86fa4&amp;gt;] ldiskfs_journal_commit_callback+0x84/0xc0 [ldiskfs]
[30779.504687]  [&amp;lt;ffffffffa0b14e9b&amp;gt;] jbd2_journal_commit_transaction+0x186b/0x1ca0 [jbd2]
[30779.514340]  [&amp;lt;ffffffffa0b1a87d&amp;gt;] kjournald2+0xcd/0x280 [jbd2]
[30779.516415]  [&amp;lt;ffffffff810b8254&amp;gt;] kthread+0xe4/0xf0
[30779.518263]  [&amp;lt;ffffffff817e0ddd&amp;gt;] ret_from_fork_nospec_begin+0x7/0x21
[30779.522814]  [&amp;lt;ffffffffffffffff&amp;gt;] 0xffffffffffffffff
[30779.528997] Kernel panic - not syncing: LBUG
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I got like 5 crashes (have crashdumps) on the first run, then it subsided, and on testing restart I got another crash, and then it went silent again for now.&lt;/p&gt;</comment>
                            <comment id="267150" author="gerrit" created="Wed, 8 Apr 2020 12:35:33 +0000"  >&lt;p&gt;Alex Zhuravlev (bzzz@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/38177&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/38177&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13408&quot; title=&quot;tgt_cancel_slc_locks()) ASSERTION( lock-&amp;gt;l_client_cookie != 0 )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13408&quot;&gt;&lt;del&gt;LU-13408&lt;/del&gt;&lt;/a&gt; tests: pass localrecov to MGS&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: c89337791dc9f026dfbbf2ac695dac7254a9800e&lt;/p&gt;</comment>
                            <comment id="267152" author="bzzz" created="Wed, 8 Apr 2020 12:41:58 +0000"  >&lt;p&gt;the patch above is a workaround. the root cause is that MDT got mounted w/o localrecov option and then the client&apos;s request had no transno,&lt;br/&gt;
which in turn is used to track commit status of cross-mdt operations.&lt;br/&gt;
I &lt;em&gt;guess&lt;/em&gt; this can be solved by a per-tx callback, instead of using transno.&lt;/p&gt;</comment>
                            <comment id="267965" author="adilger" created="Sun, 19 Apr 2020 07:56:09 +0000"  >&lt;p&gt;Alex, wouldn&apos;t it be better to handle this by ignoring the &quot;localrecov&quot; behavior for MDT and MGT mounts, rather than changing the transaction callback?&lt;/p&gt;</comment>
                            <comment id="268419" author="adilger" created="Thu, 23 Apr 2020 22:39:01 +0000"  >&lt;p&gt;I &lt;em&gt;think&lt;/em&gt; this issue is fixed by patch&#160;&lt;a href=&quot;https://review.whamcloud.com/38138&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/38138&lt;/a&gt; &quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13402&quot; title=&quot;sanity test_252: Invalid number of mdtlov clients returned by /usr/sbin/lr_reader&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13402&quot;&gt;&lt;del&gt;LU-13402&lt;/del&gt;&lt;/a&gt; target: never exclude MDT/OST from last_rcvd&lt;/tt&gt;&quot; but I&apos;d like Alex to confirm before this issue is closed.&lt;/p&gt;</comment>
                            <comment id="268463" author="bzzz" created="Fri, 24 Apr 2020 06:04:13 +0000"  >&lt;p&gt;Andreas, no, these are different problems. &lt;em&gt;this&lt;/em&gt; issue happens because &lt;em&gt;client&lt;/em&gt; (running on MDS) is excluded from recovery, thus doesn&apos;t generate a transno which is used to track committness (in turn used to cancel locks).&lt;/p&gt;
</comment>
                            <comment id="269133" author="adilger" created="Fri, 1 May 2020 20:22:14 +0000"  >&lt;p&gt;+1 on master running sanity test_103a in my VM.&lt;br/&gt;
+1 on master running sanity test_103b in my VM.&lt;/p&gt;

&lt;p&gt;Seems like this is easy for me to reproduce if there is something that you think will fix this properly.&lt;/p&gt;</comment>
                            <comment id="272065" author="laisiyao" created="Fri, 5 Jun 2020 13:34:12 +0000"  >&lt;p&gt;LDLM locks are handled in the MDT layer, while transactions are in the MDD layer; it&apos;s a layer violation to mix them together. IMO if &quot;req_transno&quot; of an operation is not 0, it&apos;s not needed to enforce Commit-on-Sharing for such an operation.&lt;/p&gt;</comment>
                            <comment id="272169" author="gerrit" created="Sun, 7 Jun 2020 12:53:53 +0000"  >&lt;p&gt;Lai Siyao (lai.siyao@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/38855&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/38855&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13408&quot; title=&quot;tgt_cancel_slc_locks()) ASSERTION( lock-&amp;gt;l_client_cookie != 0 )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13408&quot;&gt;&lt;del&gt;LU-13408&lt;/del&gt;&lt;/a&gt; mdt: don&apos;t save remote lock if req_transno is 0&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: af33439d1e383d10b226870fd533f33ffac7f078&lt;/p&gt;</comment>
                            <comment id="272946" author="gerrit" created="Tue, 16 Jun 2020 02:21:50 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/38855/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/38855/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13408&quot; title=&quot;tgt_cancel_slc_locks()) ASSERTION( lock-&amp;gt;l_client_cookie != 0 )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13408&quot;&gt;&lt;del&gt;LU-13408&lt;/del&gt;&lt;/a&gt; target: update in-memory per client data&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 300858ccfcd00b52663de45e0bb472012242f342&lt;/p&gt;</comment>
                            <comment id="272950" author="pjones" created="Tue, 16 Jun 2020 03:30:42 +0000"  >&lt;p&gt;Landed for 2.14&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="58560">LU-13402</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                                        </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i00wun:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>