<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:54:28 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-12651] High kworker CPU usage (osc_grant_work_handler) on IDLE connections</title>
                <link>https://jira.whamcloud.com/browse/LU-12651</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;We discovered that on our systems with lustre mounted, the kworker is using a significant amount of CPU. &lt;br/&gt;
perf top shows on an idle system: &lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt; 39.44%  [kernel]                  [k] osc_should_shrink_grant
  12.14%  [kernel]                  [k] osc_grant_work_handler
   2.81%  [kernel]                  [k] process_one_work
   2.64%  [kernel]                  [k] __queue_work
   2.56%  [kernel]                  [k] read_tsc
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;We currently have grant_shrink=0 on this system. &lt;/p&gt;

&lt;p&gt;Looks like doing just du -hs /fs makes the problem go away for some time. &lt;br/&gt;
Also unmounting the filesystem makes the problem go away. &lt;br/&gt;
This is a CentOS 7.6 system with Lustre 2.12.0&lt;/p&gt;</description>
                <environment></environment>
        <key id="56628">LU-12651</key>
            <summary>High kworker CPU usage (osc_grant_work_handler) on IDLE connections</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="zam">Alexander Zarochentsev</assignee>
                                    <reporter username="Tomaka">Jacek Tomaka</reporter>
                        <labels>
                            <label>LTS12</label>
                    </labels>
                <created>Fri, 9 Aug 2019 09:05:34 +0000</created>
                <updated>Tue, 25 Feb 2020 12:58:34 +0000</updated>
                            <resolved>Fri, 14 Feb 2020 13:41:52 +0000</resolved>
                                    <version>Lustre 2.12.2</version>
                                    <fixVersion>Lustre 2.14.0</fixVersion>
                    <fixVersion>Lustre 2.12.5</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>8</watches>
                                                                            <comments>
                            <comment id="252853" author="tomaka" created="Fri, 9 Aug 2019 09:19:50 +0000"  >&lt;p&gt;Most likely regression from &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-8708&quot; title=&quot;Grant shrinking disabled all the time&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-8708&quot;&gt;&lt;del&gt;LU-8708&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="260719" author="tomaka" created="Wed, 8 Jan 2020 03:33:51 +0000"  >&lt;p&gt;Any news on this ticket?&lt;/p&gt;</comment>
                            <comment id="262555" author="gerrit" created="Tue, 4 Feb 2020 17:53:23 +0000"  >&lt;p&gt;Alexander Zarochentsev (c17826@cray.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/37429&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37429&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12651&quot; title=&quot;High kworker CPU usage (osc_grant_work_handler) on IDLE connections&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12651&quot;&gt;&lt;del&gt;LU-12651&lt;/del&gt;&lt;/a&gt; osc: always call update_next_shrink&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 2986155c51914c5a63f6c351908c9a49dbe5042f&lt;/p&gt;</comment>
                            <comment id="262558" author="zam" created="Tue, 4 Feb 2020 17:56:12 +0000"  >&lt;p&gt;Jacek Tomaka, &lt;br/&gt;
can you try &lt;a href=&quot;https://review.whamcloud.com/37429&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37429&lt;/a&gt; ?&lt;/p&gt;</comment>
                            <comment id="262571" author="zam" created="Tue, 4 Feb 2020 19:18:18 +0000"  >&lt;p&gt;my experiments with 2.12-based lustre and grant_shrink=0:&lt;/p&gt;

&lt;p&gt;w/o the fix, kworker starts to eat 100% CPU after 20 min from Lustre mount time (default grant shrinking interval)&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;top - 00:03:08 up 2 days, 11:32,  3 users,  load average: 2.95, 2.47, 2.22
Tasks: 258 total,   3 running, 255 sleeping,   0 stopped,   0 zombie
%Cpu(s):  0.0 us, 25.0 sy,  0.0 ni, 75.0 id,  0.0 wa,  0.0 hi,  0.0 si,  0.0 st
KiB Mem :  2914024 total,  1138684 free,   544988 used,  1230352 buff/cache
KiB Swap:  2113532 total,  2113532 free,        0 used.  2190536 avail Mem 

  PID USER      PR  NI    VIRT    RES    SHR S  %CPU %MEM     TIME+ COMMAND                                                                                        
21631 root      20   0       0      0      0 R 100.0  0.0   3:03.08 kworker/3:2                                                                                    
    1 root      20   0  191032   3912   2584 S   0.0  0.1   0:06.70 systemd                                                                                        
    2 root      20   0       0      0      0 S   0.0  0.0   0:00.06 kthreadd                                                                                       
    3 root      20   0       0      0      0 S   0.0  0.0   0:01.06 ksoftirqd/0                                                                                    
    5 root       0 -20       0      0      0 S   0.0  0.0   0:00.00 kworker/0:0H                                                                                   
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;with the fix,&#160; 22 min after start, system is idle:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;top - 00:32:05 up 2 days, 12:01,  3 users,  load average: 2.00, 2.01, 2.06
Tasks: 261 total,   2 running, 259 sleeping,   0 stopped,   0 zombie
%Cpu(s):  0.1 us,  0.1 sy,  0.0 ni, 99.8 id,  0.0 wa,  0.0 hi,  0.0 si,  0.0 st
KiB Mem :  2914024 total,  1133004 free,   549940 used,  1231080 buff/cache
KiB Swap:  2113532 total,  2113532 free,        0 used.  2185136 avail Mem 

  PID USER      PR  NI    VIRT    RES    SHR S  %CPU %MEM     TIME+ COMMAND                                                                                        
  367 root      20   0  162180   2456   1584 R   0.3  0.1   0:00.03 top                                                                                            
    1 root      20   0  191032   3912   2584 S   0.0  0.1   0:06.85 systemd                                                                                        
    2 root      20   0       0      0      0 S   0.0  0.0   0:00.07 kthreadd                                                                                       
    3 root      20   0       0      0      0 S   0.0  0.0   0:01.10 ksoftirqd/0                                                                                    
    5 root       0 -20       0      0      0 S   0.0  0.0   0:00.00 kworker/0:0H                                                                                   
    7 root      rt   0       0      0      0 S   0.0  0.0   0:00.61 migration/0                                                                                    
    8 root      20   0       0      0      0 S   0.0  0.0   0:00.00 rcu_bh                                                                                         
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="262584" author="tomaka" created="Wed, 5 Feb 2020 00:43:55 +0000"  >&lt;p&gt;Hi Alexander, &lt;br/&gt;
Thanks for looking into it. Would you be so kind to provide patch for 2.12.3 as well?&lt;br/&gt;
Regards.&lt;br/&gt;
Jacek Tomaka&lt;/p&gt;</comment>
                            <comment id="262591" author="zam" created="Wed, 5 Feb 2020 04:16:08 +0000"  >&lt;p&gt;Jacek,&lt;br/&gt;
&amp;gt;Thanks for looking into it. Would you be so kind to provide patch for 2.12.3 as well?&lt;br/&gt;
The same patch applies to b2_12.&lt;/p&gt;</comment>
                            <comment id="263014" author="tomaka" created="Mon, 10 Feb 2020 16:40:58 +0000"  >&lt;p&gt;Hi Alexander, &lt;br/&gt;
Our initial testing on a machine with patched client(2.12.3 + &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12759&quot; title=&quot;parameter grant_shrink gets reset to 1 after client reconnects&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12759&quot;&gt;&lt;del&gt;LU-12759&lt;/del&gt;&lt;/a&gt; + this patch) shows that the kworker does not go crazy anymore. &lt;br/&gt;
Great job! Thanks!&lt;br/&gt;
Will let you know if we run into any issues with this patch. &lt;br/&gt;
Jacek Tomaka&lt;/p&gt;</comment>
                            <comment id="263288" author="gerrit" created="Fri, 14 Feb 2020 05:49:35 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/37429/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37429/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12651&quot; title=&quot;High kworker CPU usage (osc_grant_work_handler) on IDLE connections&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12651&quot;&gt;&lt;del&gt;LU-12651&lt;/del&gt;&lt;/a&gt; osc: always call update_next_shrink&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 117f587bc3e60f4dd1c939f8488e43cb752c12ca&lt;/p&gt;</comment>
                            <comment id="263343" author="pjones" created="Fri, 14 Feb 2020 13:41:52 +0000"  >&lt;p&gt;Landed for 2.14&lt;/p&gt;</comment>
                            <comment id="263355" author="gerrit" created="Fri, 14 Feb 2020 15:10:55 +0000"  >&lt;p&gt;Minh Diep (mdiep@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/37572&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37572&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12651&quot; title=&quot;High kworker CPU usage (osc_grant_work_handler) on IDLE connections&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12651&quot;&gt;&lt;del&gt;LU-12651&lt;/del&gt;&lt;/a&gt; osc: always call update_next_shrink&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 70d299f149e1cb5f396576baf452a5eba911a30a&lt;/p&gt;</comment>
                            <comment id="263982" author="gerrit" created="Tue, 25 Feb 2020 06:15:57 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/37572/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37572/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12651&quot; title=&quot;High kworker CPU usage (osc_grant_work_handler) on IDLE connections&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12651&quot;&gt;&lt;del&gt;LU-12651&lt;/del&gt;&lt;/a&gt; osc: always call update_next_shrink&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 10a799263964422df575038d3dfb507a09bfa221&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                                                <inwardlinks description="is duplicated by">
                                                        </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="40593">LU-8708</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i00l0n:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>