<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:26:12 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-16343] soft lockups ptlrpcd</title>
                <link>https://jira.whamcloud.com/browse/LU-16343</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;kernel: NMI watchdog: BUG: soft lockup - CPU#23 stuck for 22s! [ptlrpcd_01_10:3531]&lt;/p&gt;

&lt;p&gt;full version: 2.12.8_6_g5457c37-1.el7&lt;/p&gt;

&lt;p&gt;Can you let me know what debugging options I should turn on to get the info needed to diagnose the issue.&lt;/p&gt;</description>
                <environment></environment>
        <key id="73396">LU-16343</key>
            <summary>soft lockups ptlrpcd</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="4">Incomplete</resolution>
                                        <assignee username="bzzz">Alex Zhuravlev</assignee>
                                    <reporter username="dneg">Dneg</reporter>
                        <labels>
                    </labels>
                <created>Fri, 25 Nov 2022 11:41:05 +0000</created>
                <updated>Fri, 30 Jun 2023 15:40:45 +0000</updated>
                            <resolved>Fri, 27 Jan 2023 14:40:50 +0000</resolved>
                                    <version>Lustre 2.12.8</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="354168" author="bzzz" created="Fri, 25 Nov 2022 11:53:40 +0000"  >&lt;p&gt;any stack trace following that message?&lt;/p&gt;</comment>
                            <comment id="354175" author="dneg" created="Fri, 25 Nov 2022 12:53:52 +0000"  >&lt;p&gt;Hi Alex, yes, sorry, pasted below:&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
Nov  9 03:11:25 foxtrot3 kernel: NMI watchdog: BUG: soft lockup - CPU#23 stuck &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; 22s! [ptlrpcd_01_10:3531]
Nov  9 03:11:25 foxtrot3 kernel: Modules linked in: rpcsec_gss_krb5 vfat fat mpt3sas mpt2sas raid_class scsi_transport_sas mptctl mptbase nfsv3 nfs fscache mgc(OE) lustre(OE) lmv(OE) mdc(OE) fid(OE) osc(OE) lov(OE) fld(OE) ksocklnd(OE) ptlrpc(OE) obdclass(OE) lnet(OE) dell_rbu libcfs(OE) binfmt_misc bonding iTCO_wdt iTCO_vendor_support dcdbas joydev sb_edac intel_powerclamp coretemp intel_rapl iosf_mbi kvm_intel kvm irqbypass sg ipmi_si ipmi_devintf ipmi_msghandler acpi_pad wmi acpi_power_meter mei_me mei lpc_ich nfsd auth_rpcgss nfs_acl lockd grace ip_tables xfs sd_mod crc_t10dif crct10dif_generic 8021q garp mrp stp llc mgag200 i2c_algo_bit drm_kms_helper syscopyarea sysfillrect sysimgblt fb_sys_fops ttm crct10dif_pclmul crct10dif_common bnx2x crc32_pclmul ahci crc32c_intel scsi_transport_iscsi ghash_clmulni_intel libahci
Nov  9 03:11:25 foxtrot3 kernel: drm aesni_intel libata lrw gf128mul glue_helper ablk_helper cryptd megaraid_sas drm_panel_orientation_quirks dm_multipath ptp pps_core mdio libcrc32c sunrpc dm_mirror dm_region_hash dm_log dm_mod [last unloaded: usb_storage]
Nov  9 03:11:25 foxtrot3 kernel: CPU: 23 PID: 3531 Comm: ptlrpcd_01_10 Kdump: loaded Tainted: G           OE  ------------   3.10.0-1160.49.1.el7.x86_64 #1
Nov  9 03:11:25 foxtrot3 kernel: Hardware name: Dell Inc. PowerEdge R620/0KCKR5, BIOS 2.5.4 01/22/2016
Nov  9 03:11:25 foxtrot3 kernel: task: ffff9b81766a5280 ti: ffff9b817f080000 task.ti: ffff9b817f080000
Nov  9 03:11:25 foxtrot3 kernel: RIP: 0010:[&amp;lt;ffffffffa3b17aa2&amp;gt;]  [&amp;lt;ffffffffa3b17aa2&amp;gt;] native_queued_spin_lock_slowpath+0x122/0x200
Nov  9 03:11:25 foxtrot3 kernel: RSP: 0018:ffff9b817f083ad0  EFLAGS: 00000246
Nov  9 03:11:25 foxtrot3 kernel: RAX: 0000000000000000 RBX: ffff9b8ab3ab6a00 RCX: 0000000000b90000
Nov  9 03:11:25 foxtrot3 kernel: RDX: ffff9ba17f15b8c0 RSI: 0000000000590001 RDI: ffff9b95f1d56de4
Nov  9 03:11:25 foxtrot3 kernel: RBP: ffff9b817f083ad0 R08: ffff9ba17f2db8c0 R09: 0000000000000000
Nov  9 03:11:25 foxtrot3 kernel: R10: 0000000000000001 R11: ffff9b8ab3ab6a00 R12: ffffffffc09175f8
Nov  9 03:11:25 foxtrot3 kernel: R13: ffff9b8ab3ab6a00 R14: ffff9b817e897000 R15: ffffffffa3c26900
Nov  9 03:11:25 foxtrot3 kernel: FS:  0000000000000000(0000) GS:ffff9ba17f2c0000(0000) knlGS:0000000000000000
Nov  9 03:11:25 foxtrot3 kernel: CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
Nov  9 03:11:25 foxtrot3 kernel: CR2: 000055f56a905fb8 CR3: 000000293f08e000 CR4: 00000000000607e0
Nov  9 03:11:25 foxtrot3 kernel: Call Trace:
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffa417dcf3&amp;gt;] queued_spin_lock_slowpath+0xb/0xf
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffa418baa0&amp;gt;] _raw_spin_lock+0x20/0x30
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc1041bec&amp;gt;] osc_page_delete+0x1fc/0x500 [osc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc0ce1550&amp;gt;] cl_page_delete0+0x80/0x220 [obdclass]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc0ce1723&amp;gt;] cl_page_delete+0x33/0x110 [obdclass]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc1041861&amp;gt;] discard_pagevec+0x91/0x130 [osc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc104263a&amp;gt;] osc_lru_shrink+0x74a/0x7c0 [osc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc104364c&amp;gt;] lru_queue_work+0x4c/0x230 [osc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc0eae31a&amp;gt;] work_interpreter+0x3a/0xf0 [ptlrpc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc0eab231&amp;gt;] ptlrpc_check_set.part.23+0x481/0x1dd0 [ptlrpc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffa3ae26ec&amp;gt;] ? set_next_entity+0x3c/0xe0
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc0eacbdb&amp;gt;] ptlrpc_check_set+0x5b/0xe0 [ptlrpc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc0ed810b&amp;gt;] ptlrpcd_check+0x4ab/0x590 [ptlrpc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc0ed84f0&amp;gt;] ptlrpcd+0x300/0x560 [ptlrpc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffa3adadf0&amp;gt;] ? wake_up_state+0x20/0x20
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffc0ed81f0&amp;gt;] ? ptlrpcd_check+0x590/0x590 [ptlrpc]
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffa3ac5e61&amp;gt;] kthread+0xd1/0xe0
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffa3ac5d90&amp;gt;] ? insert_kthread_work+0x40/0x40
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffa4195df7&amp;gt;] ret_from_fork_nospec_begin+0x21/0x21
Nov  9 03:11:25 foxtrot3 kernel: [&amp;lt;ffffffffa3ac5d90&amp;gt;] ? insert_kthread_work+0x40/0x40
Nov  9 03:11:25 foxtrot3 kernel: Code: 13 48 c1 ea 0d 48 98 83 e2 30 48 81 c2 c0 b8 01 00 48 03 14 c5 60 15 75 a4 4c 89 02 41 8b 40 08 85 c0 75 0f 0f 1f 44 00 00 f3 90 &amp;lt;41&amp;gt; 8b 40 08 85 c0 74 f6 4d 8b 08 4d 85 c9 74 04 41 0f 18 09 8b
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="356433" author="dneg" created="Wed, 14 Dec 2022 16:30:59 +0000"  >&lt;p&gt;Hi Alex,&lt;/p&gt;

&lt;p&gt;Do you need any further information?&lt;/p&gt;

&lt;p&gt;Kind regards,&lt;br/&gt;
Campbell&lt;/p&gt;</comment>
                            <comment id="356810" author="bzzz" created="Mon, 19 Dec 2022 08:30:52 +0000"  >&lt;p&gt;can you please attach full dmesg/syslog output? probably something bad happened before.&lt;/p&gt;</comment>
                            <comment id="357624" author="dneg" created="Thu, 29 Dec 2022 11:01:41 +0000"  >&lt;p&gt;Hi Alex,&lt;/p&gt;

&lt;p&gt;full syslog file attached&lt;/p&gt;</comment>
                            <comment id="359122" author="bzzz" created="Sat, 14 Jan 2023 19:27:19 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=dneg&quot; class=&quot;user-hover&quot; rel=&quot;dneg&quot;&gt;dneg&lt;/a&gt; thanks for the log. unfortunately the log has only the one trace, so I can&apos;t identify another thread holding the spinlock. ideally we need a crashdump or full set of traces (echo t &amp;gt;/proc/sysrq-trigger) to be able to find which process was holding the spinlock and so blocking ptlrpcd.&lt;/p&gt;</comment>
                            <comment id="359196" author="dneg" created="Mon, 16 Jan 2023 18:28:10 +0000"  >&lt;p&gt;Hi Alex,&lt;/p&gt;

&lt;p&gt;We have had only one ptlrpcd lockup since the beginning of December last year. I think we could close this ticket for now, and open a new one if needed&lt;/p&gt;

&lt;p&gt;Thanks,&lt;br/&gt;
Campbell&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="47541" name="2022-11-09-syslog.log.gz" size="568807" author="dneg" created="Thu, 29 Dec 2022 11:01:08 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i036k7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>