<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:26:45 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-2619] Bogus value of dqb_curinodes returned by osc_quotactl</title>
                <link>https://jira.whamcloud.com/browse/LU-2619</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;When running &lt;tt&gt;lfs quota -u &amp;lt;USER&amp;gt; &amp;lt;FS&amp;gt;&lt;/tt&gt; on Sequoia, a couple users do not have any files in their directory but quota reports a bogus large value:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;# lfs quota -u pjmccart /p/ls1
Disk quotas for user pjmccart (uid 8624):
     Filesystem  kbytes   quota   limit   grace   files   quota   limit   grace
         /p/ls1     913       0       0       - 18446744073709547865       0       0       -

# du -sh /p/ls1/pjmccart/
913K    /p/ls1/pjmccart/

# ls -alR /p/ls1/pjmccart/
/p/ls1/pjmccart/:
total 1214
913 drwx------    2 pjmccart pjmccart 934400 Nov 15 10:28 ./
302 drwxr-xr-x 2193 root     root     308736 Jan 11 08:05 ../ 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Using &lt;tt&gt;systemtap&lt;/tt&gt; to print the &lt;tt&gt;obd_quotactl&lt;/tt&gt; structure when the &lt;tt&gt;osc_quotactl&lt;/tt&gt; function returns, I see odd values coming from two of the OSCs:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;osc_quotactl: &quot;ls1-OST0037-osc-c0000003c865a400&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=8624, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=0, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .dqb_padding=0}}
osc_quotactl: &quot;ls1-OST0038-osc-c0000003c865a400&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=8624, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551615, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .dqb_padding=0}}
osc_quotactl: &quot;ls1-OST0039-osc-c0000003c865a400&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=8624, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=0, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .dqb_padding=0}}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;osc_quotactl: &quot;ls1-OST0073-osc-c0000003c865a400&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=8624, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=3, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .dqb_padding=0}}
osc_quotactl: &quot;ls1-OST0074-osc-c0000003c865a400&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=8624, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551615, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .dqb_padding=0}}
osc_quotactl: &quot;ls1-OST0075-osc-c0000003c865a400&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=8624, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=3, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .dqb_padding=0}}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Specifically, the values of &lt;tt&gt;dqb_curinodes&lt;/tt&gt;:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;ls1-OST0074-osc-c0000003c865a400:dqb_curinodes=18446744073709551615
ls1-OST0038-osc-c0000003c865a400:dqb_curinodes=18446744073709551615
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="17170">LU-2619</key>
            <summary>Bogus value of dqb_curinodes returned by osc_quotactl</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="2">Won&apos;t Fix</resolution>
                                        <assignee username="niu">Niu Yawei</assignee>
                                    <reporter username="prakash">Prakash Surya</reporter>
                        <labels>
                            <label>llnl</label>
                    </labels>
                <created>Tue, 15 Jan 2013 11:03:05 +0000</created>
                <updated>Mon, 11 May 2015 21:10:14 +0000</updated>
                            <resolved>Tue, 20 Jan 2015 23:38:31 +0000</resolved>
                                    <version>Lustre 2.4.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="50510" author="pjones" created="Tue, 15 Jan 2013 18:05:04 +0000"  >&lt;p&gt;Niu&lt;/p&gt;

&lt;p&gt;Could you please look into this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="50526" author="niu" created="Tue, 15 Jan 2013 23:10:49 +0000"  >&lt;p&gt;I suppose the backend is zfs, and the &quot;quota_iused_estimate&quot; is 0 (you can check it under the osd-zfs proc dir), right?&lt;/p&gt;

&lt;p&gt;The curinodes from OSTs will not be counted in the total inode usage at the end, though the number implies something is wrong. I guess the MDC was getting the same number too, is it possible to get some log with D_QUOTA enabled on the MDT or the OSTs which returning invalid number? Thanks.&lt;/p&gt;</comment>
                            <comment id="67262" author="prakash" created="Mon, 23 Sep 2013 17:16:55 +0000"  >&lt;p&gt;Ping. We&apos;re still suffering from this.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;# sierra38 /root &amp;gt; cat /proc/fs/lustre/version 
lustre: 2.1.4
kernel: patchless_client
build:  2.1.4-5chaos-5chaos--PRISTINE-2.6.32-358.11.1.2chaos.ch5.1.x86_64
# sierra38 /root &amp;gt; cat TOSS-27.stp 
probe module(&quot;lquota&quot;).function(&quot;client_quota_ctl&quot;).return {
        printf(&quot;%s: %s: %s\n&quot;, probefunc(), @cast($exp, &quot;obd_export&quot;)-&amp;gt;exp_obd-&amp;gt;obd_name$, $oqctl$$);
}
# sierra38 /root &amp;gt; stap TOSS-27.stp -c &quot;lfs quota -u richmond /p/lscratche&quot;
Disk quotas for user richmond (uid 1098):
     Filesystem  kbytes   quota   limit   grace   files   quota   limit   grace
   /p/lscratche       8       0       0       - 18446744073709551606       0       0       -
client_quota_ctl: &quot;lse-MDT0000-mdc-ffff8802fa988c00&quot;: {.qc_cmd=8388615, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=0, .dqb_btime=0, .dqb_itime=0, .dqb_valid=0, .padding=0}}
client_quota_ctl: &quot;lse-OST0001-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=0, .dqb_btime=0, .dqb_itime=0, .dqb_valid=0, .padding=0}}
client_quota_ctl: &quot;lse-OST0002-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551419, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST0003-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551442, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST0004-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551404, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST0005-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551487, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST0006-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551433, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST0007-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551521, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST0008-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551422, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST0009-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551416, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST000a-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551325, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST000b-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551499, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST000c-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551469, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST000d-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551340, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST000e-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551387, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST000f-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551435, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-OST0010-osc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=18446744073709551326, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
client_quota_ctl: &quot;lse-MDT0000-mdc-ffff8802fa988c00&quot;: {.qc_cmd=8388867, .qc_type=0, .qc_id=1098, .qc_stat=0, .qc_dqinfo={.dqi_bgrace=0, .dqi_igrace=0, .dqi_flags=0, .dqi_valid=0}, .qc_dqblk={.dqb_bhardlimit=0, .dqb_bsoftlimit=0, .dqb_curspace=0, .dqb_ihardlimit=0, .dqb_isoftlimit=0, .dqb_curinodes=0, .dqb_btime=0, .dqb_itime=0, .dqb_valid=15, .padding=0}}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;blockquote&gt;
&lt;p&gt;I suppose the backend is zfs, and the &quot;quota_iused_estimate&quot; is 0 (you can check it under the osd-zfs proc dir), right?&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;Yes.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;# porteri /root &amp;gt; pdsh -w porter[1-16] &apos;cat /proc/fs/lustre/osd-zfs/*/quota_iused_estimate&apos; | dshbak -c
----------------
porter[1-16]
----------------
0
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;blockquote&gt;
&lt;p&gt;The curinodes from OSTs will not be counted in the total inode usage at the end, though the number implies something is wrong. I guess the MDC was getting the same number too, is it possible to get some log with D_QUOTA enabled on the MDT or the OSTs which returning invalid number? Thanks.&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;I&apos;ll see if I can get some debug logs from the problem OSTs.&lt;/p&gt;</comment>
                            <comment id="68796" author="niu" created="Fri, 11 Oct 2013 02:55:29 +0000"  >&lt;p&gt;What&apos;s exact client &amp;amp; server version? client_quota_ctl() should only exist in 2.1 and earlier version.&lt;/p&gt;</comment>
                            <comment id="68859" author="prakash" created="Fri, 11 Oct 2013 20:16:19 +0000"  >&lt;p&gt;Sorry I haven&apos;t gotten any debug data pushed to you yet. Would that still be useful? And if so, from the MDT, OST, or both?&lt;/p&gt;

&lt;p&gt;The client version taken from the previous comment:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;# sierra38 /root &amp;gt; cat /proc/fs/lustre/version 
lustre: 2.1.4
kernel: patchless_client
build:  2.1.4-5chaos-5chaos--PRISTINE-2.6.32-358.11.1.2chaos.ch5.1.x86_64
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;The server version:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;# porter-mds1 /root &amp;gt; cat /proc/fs/lustre/version 
lustre: 2.4.0
kernel: patchless_client
build:  2.4.0-15chaos-15chaos--PRISTINE-2.6.32-358.14.1.2chaos.ch5.1.1.x86_64
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="68891" author="niu" created="Mon, 14 Oct 2013 02:04:55 +0000"  >&lt;p&gt;The bogus value is returned from the OST, so the log on the OST would be helpful; however, these inode usage values from the OSTs are not counted, so I guess the value displayed in the &apos;lfs quota&apos; output comes from the MDT. Could you get logs from both the MDT &amp;amp; OST? Thanks.&lt;/p&gt;</comment>
                            <comment id="70666" author="marc@llnl.gov" created="Mon, 4 Nov 2013 22:33:53 +0000"  >&lt;p&gt;I have attached the MDS logs generated after running this command:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;# oslic1 /root &amp;gt; lfs quota -u  40186 /p/lscratche
Disk quotas for user 40186 (uid 40186):
     Filesystem  kbytes   quota   limit   grace   files   quota   limit   grace
   /p/lscratche      14       0       0       - 18446744073709551606       0       0       -
# oslic1 /root &amp;gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;


&lt;p&gt;The OSS logs total 100MB compressed, so I can&apos;t upload them all at once.  If you want specific ones, or have an FTP site, I can get them to you.&lt;/p&gt;</comment>
                            <comment id="70697" author="pjones" created="Tue, 5 Nov 2013 07:52:35 +0000"  >&lt;p&gt;Marc&lt;/p&gt;

&lt;p&gt;I have privately emailed you details of how to get us the logs&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="70731" author="marc@llnl.gov" created="Tue, 5 Nov 2013 16:14:59 +0000"  >&lt;p&gt;Thank you Peter.  I created an &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2619&quot; title=&quot;Bogus value of dqb_curinodes returned by osc_quotactl&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2619&quot;&gt;&lt;del&gt;LU-2619&lt;/del&gt;&lt;/a&gt; directory, and placed a file called &quot;porter_lustre_logs.tgz&quot;  It is about 115MB compressed.  Untarred, it will be about 2.4GB. Let me know if you need anything else.&lt;/p&gt;</comment>
                            <comment id="70825" author="niu" created="Wed, 6 Nov 2013 08:06:38 +0000"  >&lt;p&gt;Unfortunately, I didn&apos;t find any clue in the logs.&lt;/p&gt;

&lt;p&gt;Marc, could you apply the debug patch (&lt;a href=&quot;http://review.whamcloud.com/#/c/8191/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/8191/&lt;/a&gt;) and try to get the log in following steps again? Thanks a lot.&lt;/p&gt;

&lt;p&gt;1. &apos;lctl clear&apos; on MDS and OSTs to clear the debug buffer;&lt;br/&gt;
2. enable D_QUOTA &amp;amp; D_TRACE on MDS and OSTs; (echo +quota &amp;gt; /proc/sys/lnet/debug; echo +trace &amp;gt; /proc/sys/lnet/debug);&lt;br/&gt;
3. &apos;lctl debug_daemon start $tmpfile 300&apos; on MDS and OSTs to start the debug daemon;&lt;br/&gt;
4. &apos;lctl mark &quot;======= lfs quota ======&quot;&apos; on MDS and OSTs to set a marker in debug log;&lt;br/&gt;
5. execute the lfs quota command which prints the bogus value;&lt;br/&gt;
6. &apos;lctl debug_daemon stop&apos; on MDS and OSTs to stop debug daemon;&lt;br/&gt;
7. &apos;lctl debug_file $tmpfile $logfile&apos; to convert binary logs into text files;&lt;br/&gt;
8. put the text log files from the previous step on the ftp site;&lt;/p&gt;</comment>
                            <comment id="70859" author="marc@llnl.gov" created="Wed, 6 Nov 2013 16:10:45 +0000"  >&lt;p&gt;Applying a patch will take a few weeks.  Is it useful to run the above steps without the patch?&lt;/p&gt;</comment>
                            <comment id="70942" author="niu" created="Thu, 7 Nov 2013 01:16:19 +0000"  >&lt;p&gt;It&apos;s better to apply the patch, or you can use systemtap to print these values in osd_acct_index_lookup().&lt;/p&gt;</comment>
                            <comment id="71150" author="prakash" created="Fri, 8 Nov 2013 19:10:34 +0000"  >&lt;p&gt;Sigh.. Systemtap is failing me..&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;# porter34 /root &amp;gt; stap -v TOSS-27.stp 
Pass 1: parsed user script and 91 library script(s) using 101264virt/26156res/2964shr/24060data kb, in 110usr/0sys/111real ms.
semantic error: failed to retrieve location attribute for &apos;osd&apos; (dieoffset: 0x8434c): identifier &apos;$osd&apos; at TOSS-27.stp:3:9
        source:                 @cast($osd, &quot;osd_device&quot;)-&amp;gt;od_svname$,
                                      ^

Pass 2: analyzed script: 1 probe(s), 7 function(s), 0 embed(s), 0 global(s) using 249680virt/34380res/6848shr/27132data kb, in 20usr/20sys/40real ms.
Pass 2: analysis failed.  Try again with another &apos;--vp 01&apos; option.
# porter34 /root &amp;gt; cat TOSS-27.stp 
probe module(&quot;osd-zfs&quot;).function(&quot;osd_acct_index_lookup&quot;).return {
        printf(&quot;%s: %s: id: %s, ispace: %u, bspace: %u\n&quot;, probefunc(),
                @cast($osd, &quot;osd_device&quot;)-&amp;gt;od_svname$,
                $buf, @cast($rec, &quot;lquota_acct_rec&quot;)-&amp;gt;ispace,
                @cast($rec, &quot;lquota_acct_rec&quot;)-&amp;gt;bspace);
}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="71220" author="niu" created="Mon, 11 Nov 2013 07:00:43 +0000"  >&lt;p&gt;This problem happened on both the 2.1.4 client and the 2.4 client, right? Is it possible to make a reproducer?&lt;/p&gt;</comment>
                            <comment id="71344" author="prakash" created="Tue, 12 Nov 2013 17:45:03 +0000"  >&lt;p&gt;Yes, we see the same behavior on 2.1 and 2.4 clients. The server is 2.4 only, though. I don&apos;t know if the same would happen on a 2.1 server. We have a reproducer, but I think it is dependent on the server returning a &quot;bad&quot; value. Perhaps we can try to reproduce this in a VM setup, using a &quot;fail_loc&quot; on the server to return a bogus value to the client? I haven&apos;t tried that, but it &lt;em&gt;might&lt;/em&gt; work.&lt;/p&gt;</comment>
                            <comment id="71388" author="niu" created="Wed, 13 Nov 2013 01:44:34 +0000"  >&lt;p&gt;what do you mean using a &apos;fail_loc&apos; on server to return a bogus value to client? I don&apos;t think server is expected to return a bad value.&lt;/p&gt;</comment>
                            <comment id="71458" author="prakash" created="Wed, 13 Nov 2013 19:42:22 +0000"  >&lt;p&gt;Well, I&apos;m still unsure where the bad value is coming from, but my guess is it&apos;s coming from the server. I could be wrong, though.&lt;/p&gt;

&lt;p&gt;I&apos;m assuming the bad &quot;dqb_curinodes&quot; values uncovered by the client systemtap script is coming from the server, is that not the case?&lt;/p&gt;</comment>
                            <comment id="71494" author="niu" created="Thu, 14 Nov 2013 01:23:49 +0000"  >&lt;blockquote&gt;
&lt;p&gt;I&apos;m assuming the bad &quot;dqb_curinodes&quot; values uncovered by the client systemtap script is coming from the server, is that not the case?&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;That&apos;s quite possible. I&apos;m just not sure the purpose of using a &apos;fail_loc&apos; on server to return bad value to client.&lt;/p&gt;</comment>
                            <comment id="88581" author="niu" created="Wed, 9 Jul 2014 13:02:53 +0000"  >&lt;p&gt;The bogus &apos;dqb_curinodes&apos; comes from OST, I&apos;m wondering how it can contribute to the &apos;files&apos; of &apos;lfs quota&apos; output, because we only collect inode usage on MDTs:&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;                        &lt;span class=&quot;code-comment&quot;&gt;/* collect space usage from OSTs */&lt;/span&gt;
                        oqctl_tmp-&amp;gt;qc_dqblk.dqb_curspace = 0;
                        rc = obd_quotactl(sbi-&amp;gt;ll_dt_exp, oqctl_tmp);
                        &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (!rc || rc == -EREMOTEIO) {
                                oqctl-&amp;gt;qc_dqblk.dqb_curspace =
                                        oqctl_tmp-&amp;gt;qc_dqblk.dqb_curspace;
                                oqctl-&amp;gt;qc_dqblk.dqb_valid |= QIF_SPACE;
                        }

                        &lt;span class=&quot;code-comment&quot;&gt;/* collect space &amp;amp; inode usage from MDTs */&lt;/span&gt;
                        oqctl_tmp-&amp;gt;qc_dqblk.dqb_curspace = 0;
                        oqctl_tmp-&amp;gt;qc_dqblk.dqb_curinodes = 0;
                        rc = obd_quotactl(sbi-&amp;gt;ll_md_exp, oqctl_tmp);
                        &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (!rc || rc == -EREMOTEIO) {
                                oqctl-&amp;gt;qc_dqblk.dqb_curspace +=
                                        oqctl_tmp-&amp;gt;qc_dqblk.dqb_curspace;
                                oqctl-&amp;gt;qc_dqblk.dqb_curinodes =
                                        oqctl_tmp-&amp;gt;qc_dqblk.dqb_curinodes;
                                oqctl-&amp;gt;qc_dqblk.dqb_valid |= QIF_INODES;
                        } &lt;span class=&quot;code-keyword&quot;&gt;else&lt;/span&gt; {
                                oqctl-&amp;gt;qc_dqblk.dqb_valid &amp;amp;= ~QIF_SPACE;
                        }
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I did some local testing, making the OST return a fake &apos;curinodes&apos; value to the client; however, the client ignored the fake value as expected.&lt;/p&gt;

&lt;p&gt;While investigating why the server returns a bogus value, I&apos;d like to verify that the client code you are running wasn&apos;t changed by some unexpected patch. Could you show me where to check the client code? (llnl tree? which tag?) Thank you.&lt;/p&gt;</comment>
                            <comment id="88595" author="prakash" created="Wed, 9 Jul 2014 14:57:29 +0000"  >&lt;p&gt;As always, our source and releases are on github: &lt;a href=&quot;https://github.com/chaos/lustre&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://github.com/chaos/lustre&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;As far as which releases were installed on the servers and clients in question, I&apos;ll have to ask the admins. Marc Stearman, can you double check this issue is still occurring on Sequoia and report back the version currently installed there?&lt;/p&gt;</comment>
                            <comment id="88603" author="marc@llnl.gov" created="Wed, 9 Jul 2014 15:21:20 +0000"  >&lt;p&gt;Yes it is still happening on all of our file systems, so the current tag will work for you.&lt;/p&gt;</comment>
                            <comment id="88627" author="morrone" created="Wed, 9 Jul 2014 18:06:35 +0000"  >&lt;p&gt;In other words, tag 2.4.2-13chaos.&lt;/p&gt;</comment>
                            <comment id="88672" author="niu" created="Thu, 10 Jul 2014 02:50:46 +0000"  >&lt;p&gt;Thank you, I didn&apos;t see any difference in client code.&lt;/p&gt;

&lt;p&gt;It looks like the debug patch (&lt;a href=&quot;http://review.whamcloud.com/#/c/8191/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/8191/&lt;/a&gt;) has been applied in the code. Is it possible to capture server logs with D_QUOTA enabled, so we can see if the bogus value is returned from osd_acct_index_lookup()?&lt;/p&gt;</comment>
                            <comment id="103286" author="marc@llnl.gov" created="Mon, 12 Jan 2015 23:11:56 +0000"  >&lt;p&gt;I enabled +quota debugging on the MDS.  Then I ran this command:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[root@surface86:~]# lfs quota -u weems2 /p/lscratche
Disk quotas for user weems2 (uid 59519):
     Filesystem  kbytes   quota   limit   grace   files   quota   limit   grace
   /p/lscratche      88       0       0       - 18446744073709551462       0       0       -
[root@surface86:~]# 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;You can see that the files column is very large.  I then dumped the debug logs on the MDS right after that:  These are the lines from the quota debugging:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00040000:04000000:5.0F:1421104120.034812:0:13022:0:(qmt_handler.c:65:qmt_get()) $$$ fetch settings qmt:lse-QMT0000 pool:0-md id:59519 enforced:0 hard:0 soft:0 granted:0 time:0 qunit:0 edquot:0 may_rel:0 revoke:0
00040000:04000000:5.0:1421104120.034818:0:13022:0:(qmt_handler.c:65:qmt_get()) $$$ fetch settings qmt:lse-QMT0000 pool:0-dt id:59519 enforced:0 hard:0 soft:0 granted:0 time:0 qunit:0 edquot:0 may_rel:0 revoke:0
00000001:04000000:4.0F:1421104120.068222:0:13022:0:(osd_quota.c:122:osd_acct_index_lookup()) lse-MDT0000: id:e87f, ispace:18446744073709551462, bspace:90112
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Do you need lines from OSTs as well, or just from the MDS?&lt;/p&gt;</comment>
                            <comment id="103306" author="niu" created="Tue, 13 Jan 2015 07:03:50 +0000"  >&lt;p&gt;From the log we can see the bogus value is from MDS, and it&apos;s read from the zap object which we created for inode accounting. Given that this problem happened only for inode accounting, I highly suspect it&apos;s related to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2435&quot; title=&quot;inode accounting in osd-zfs is racy&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2435&quot;&gt;&lt;del&gt;LU-2435&lt;/del&gt;&lt;/a&gt;. I think a temporary workaround is to set the quota_iused_estimate to 1.&lt;/p&gt;

&lt;blockquote&gt;
&lt;p&gt;Do you need lines from OSTs as well, or just from the MDS?&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;No, I think MDS log is enough. Thank you.&lt;/p&gt;</comment>
                            <comment id="103338" author="marc@llnl.gov" created="Tue, 13 Jan 2015 16:38:04 +0000"  >&lt;p&gt;Thanks, setting quota_iused_estimate to 1 reports a more realistic value:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[root@surface86:~]# lfs quota -u weems2 /p/lscratche
Disk quotas for user weems2 (uid 59519):
     Filesystem  kbytes   quota   limit   grace   files   quota   limit   grace
   /p/lscratche      88       0       0       -       1       0       0       -
[root@surface86:~]# 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I will watch the status of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2435&quot; title=&quot;inode accounting in osd-zfs is racy&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2435&quot;&gt;&lt;del&gt;LU-2435&lt;/del&gt;&lt;/a&gt;.  Are there any other downsides to setting quota_iused_estimate to 1?&lt;/p&gt;</comment>
                            <comment id="103731" author="niu" created="Fri, 16 Jan 2015 06:19:53 +0000"  >&lt;blockquote&gt;
&lt;p&gt;Are there any other downsides to setting quota_iused_estimate to 1?&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;With quota_iused_estimate = 1, the reported inode accounting is calculated based on the space consumed on the MDT, so it&apos;s not as accurate as with quota_iused_estimate = 0.&lt;/p&gt;</comment>
                            <comment id="104119" author="marc@llnl.gov" created="Tue, 20 Jan 2015 23:24:48 +0000"  >&lt;p&gt;I think this is a decent workaround for my purposes.  I&apos;m happy to close this one, and I will await a fix in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2435&quot; title=&quot;inode accounting in osd-zfs is racy&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2435&quot;&gt;&lt;del&gt;LU-2435&lt;/del&gt;&lt;/a&gt; that will allow us to scan the file system and fix broken ZAP entries.&lt;/p&gt;</comment>
                            <comment id="104124" author="pjones" created="Tue, 20 Jan 2015 23:38:31 +0000"  >&lt;p&gt;ok thanks Marc!&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="14304">LU-2435</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="13754" name="porter-mds1.txt.gz" size="132554" author="marc@llnl.gov" created="Mon, 4 Nov 2013 22:33:53 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvfav:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>6124</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>