<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:22:40 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-15947] Spinlock contention during wake_up_all() in obd_put_mod_rpc_slot()</title>
                <link>https://jira.whamcloud.com/browse/LU-15947</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Multiple nodes down with spinlock contention&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;c0-0c0s14n1-2204300051.cdump:crash_x86_64&amp;gt; sys
      KERNEL: vmlinux-5.3.18-59.34_7.0.4.6-cray_ari_c
    DUMPFILE: c0-0c0s14n1-2204300051.cdump  [PARTIAL DUMP]
        CPUS: 256
        DATE: Fri Apr 29 15:59:58 CDT 2022
      UPTIME: 02:20:22
LOAD AVERAGE: 214.66, 137.29, 95.43
       TASKS: 2710
    NODENAME: nid00057
     RELEASE: 5.3.18-59.34_7.0.4.6-cray_ari_c
     VERSION: #1 SMP Wed Apr 27 03:52:58 UTC 2022 (cce0346)
     MACHINE: x86_64  (1300 Mhz)
      MEMORY: 95.9 GB
       PANIC: &quot;&quot;
crash_x86_64&amp;gt;
crash_x86_64&amp;gt; epython rcu
sched struct rcu_state ffffffff82059000 in progress (last activity 4296989573/ period end 4296989561) for 8243 jiffies
  show the queue length with -l
cpu 255 sched PENDING, not stalled yet (not completed)
** Execution took   0.02s (real)   0.02s (CPU)
crash_x86_64&amp;gt;
rcu thread has not run for almost 8243 jiffies or 32 seconds.
There are 135 CPUs that are currently spinning on some lock;
most of these are in the following stack trace:
crash_x86_64&amp;gt; bt -c 255
PID: 34632  TASK: ffff889708048940  CPU: 255  COMMAND: &quot;ldlm_bl_10&quot;
    [exception RIP: queued_spin_lock_slowpath+377]
    RIP: ffffffff810d1a49  RSP: ffffc9000fca7aa0  RFLAGS: 00000046
    RAX: 0000000000000000  RBX: ffff88972ed9b060  RCX: 0000000004000000
    RDX: ffff8897ddbe9dc0  RSI: 00000000000000ab  RDI: ffff88972ed9b060
    RBP: ffffc9000fca7aa0   R8: 0000000004000000   R9: 0000000000028a80
    R10: ffffc9000fca79a0  R11: 000000000000010e  R12: 0000000000000202
    R13: 0000000000000202  R14: 0000000000000000  R15: 0000000000000003
    CS: 0010  SS: 0018
 #0 [ffffc9000fca7aa8] _raw_spin_lock_irqsave at ffffffff81703da7
 #1 [ffffc9000fca7ac8] __wake_up_common_lock at ffffffff810c5dc3
 #2 [ffffc9000fca7b38] __wake_up at ffffffff810c5e33
 #3 [ffffc9000fca7b48] obd_put_mod_rpc_slot at ffffffffa04f5964 [obdclass]
 #4 [ffffc9000fca7b68] ptlrpc_put_mod_rpc_slot at ffffffffa067fd34 [ptlrpc]
 #5 [ffffc9000fca7b90] mdc_close at ffffffffa08783ac [mdc]
 #6 [ffffc9000fca7be0] lmv_close at ffffffffa08b7d82 [lmv]
 #7 [ffffc9000fca7c20] ll_close_inode_openhandle at ffffffffa08f7641 [lustre]
 #8 [ffffc9000fca7c78] ll_md_real_close at ffffffffa08fa7ce [lustre]
 #9 [ffffc9000fca7ca8] ll_md_blocking_ast at ffffffffa092db4d [lustre]
#10 [ffffc9000fca7d10] ldlm_cancel_callback at ffffffffa0660128 [ptlrpc]
#11 [ffffc9000fca7d68] ldlm_cli_cancel_local at ffffffffa066d8e5 [ptlrpc]
#12 [ffffc9000fca7d90] ldlm_cli_cancel at ffffffffa0672d2b [ptlrpc]
#13 [ffffc9000fca7df8] ll_md_blocking_ast at ffffffffa092d510 [lustre]
#14 [ffffc9000fca7e60] ldlm_handle_bl_callback at ffffffffa0675c30 [ptlrpc]
#15 [ffffc9000fca7e88] ldlm_bl_thread_main at ffffffffa067641a [ptlrpc]
#16 [ffffc9000fca7f08] kthread at ffffffff810a2400
#17 [ffffc9000fca7f50] ret_from_fork at ffffffff8180021a
crash_x86_64&amp;gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="70756">LU-15947</key>
            <summary>Spinlock contention during wake_up_all() in obd_put_mod_rpc_slot()</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="stancheff">Shaun Tancheff</assignee>
                                    <reporter username="stancheff">Shaun Tancheff</reporter>
                        <labels>
                    </labels>
                <created>Wed, 15 Jun 2022 09:53:09 +0000</created>
                <updated>Mon, 11 Dec 2023 07:18:31 +0000</updated>
                            <resolved>Thu, 9 Mar 2023 20:20:39 +0000</resolved>
                                                    <fixVersion>Lustre 2.16.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>7</watches>
                                                                            <comments>
                            <comment id="337809" author="gerrit" created="Wed, 15 Jun 2022 09:55:25 +0000"  >&lt;p&gt;&quot;Shaun Tancheff &amp;lt;shaun.tancheff@hpe.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/47634&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/47634&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15947&quot; title=&quot;Spinlock contention during wake_up_all() in obd_put_mod_rpc_slot()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15947&quot;&gt;&lt;del&gt;LU-15947&lt;/del&gt;&lt;/a&gt; ptlrpc: Sort waiters on close_req completion&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 4eb788baf0bdd5241999f101e17c00c275e067e0&lt;/p&gt;</comment>
                            <comment id="352090" author="gerrit" created="Tue, 8 Nov 2022 08:50:09 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/44041/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/44041/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15947&quot; title=&quot;Spinlock contention during wake_up_all() in obd_put_mod_rpc_slot()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15947&quot;&gt;&lt;del&gt;LU-15947&lt;/del&gt;&lt;/a&gt; obdclass: improve precision of wakeups for mod_rpcs&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 5243630b09d22e0b576d81390d604774881f63f7&lt;/p&gt;</comment>
                            <comment id="365424" author="spitzcor" created="Thu, 9 Mar 2023 20:20:39 +0000"  >&lt;p&gt;I think we can consider this resolved with the landing of &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/44041&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/44041&lt;/a&gt;.&lt;/p&gt;</comment>
                            <comment id="365425" author="spitzcor" created="Thu, 9 Mar 2023 20:21:49 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=stancheff&quot; class=&quot;user-hover&quot; rel=&quot;stancheff&quot;&gt;stancheff&lt;/a&gt;, do you agree?  ^^^&lt;br/&gt;
Please open a new ticket if there is remaining work.&lt;/p&gt;</comment>
                            <comment id="377255" author="gerrit" created="Mon, 3 Jul 2023 13:40:04 +0000"  >&lt;p&gt;&quot;Etienne AUJAMES &amp;lt;eaujames@ddn.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/51538&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/51538&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15947&quot; title=&quot;Spinlock contention during wake_up_all() in obd_put_mod_rpc_slot()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15947&quot;&gt;&lt;del&gt;LU-15947&lt;/del&gt;&lt;/a&gt; obdclass: improve precision of wakeups for mod_rpcs&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_15&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 54e1ad7ad3c8f894d0805d9765f341e112c38afe&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="78392">LU-17197</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="75015">LU-16633</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i02s73:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>