<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:43:24 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-4515] Test failure sanity-quota test_34: Used space for user 60000 is 0, expected 2048</title>
                <link>https://jira.whamcloud.com/browse/LU-4515</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for Nathaniel Clark &amp;lt;nathaniel.l.clark@intel.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run:&lt;br/&gt;
&lt;a href=&quot;http://maloo.whamcloud.com/test_sets/0c69b0d8-7e9d-11e3-b6d1-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://maloo.whamcloud.com/test_sets/0c69b0d8-7e9d-11e3-b6d1-52540035b04c&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/e355e8f2-8148-11e3-81ba-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/e355e8f2-8148-11e3-81ba-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;The sub-test test_34 failed with the following error:&lt;/p&gt;
&lt;blockquote&gt;
&lt;p&gt;Used space for user 60000 is 0, expected 2048&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;Info required for matching: sanity-quota 34&lt;/p&gt;</description>
                <environment></environment>
        <key id="22817">LU-4515</key>
            <summary>Test failure sanity-quota test_34: Used space for user 60000 is 0, expected 2048</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="niu">Niu Yawei</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Mon, 20 Jan 2014 19:35:13 +0000</created>
                <updated>Thu, 2 Oct 2014 21:18:07 +0000</updated>
                            <resolved>Fri, 4 Jul 2014 18:26:21 +0000</resolved>
                                    <version>Lustre 2.6.0</version>
                                    <fixVersion>Lustre 2.6.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>11</watches>
                                                                            <comments>
                            <comment id="75518" author="jlevi" created="Thu, 23 Jan 2014 18:39:26 +0000"  >&lt;p&gt;Niu,&lt;br/&gt;
Could you please take a look at this one?&lt;br/&gt;
Thank you!&lt;/p&gt;</comment>
                            <comment id="75525" author="adilger" created="Thu, 23 Jan 2014 19:51:03 +0000"  >&lt;p&gt;I would suspect this is a regression in a patch that landed recently.  The problem only appeared on 2014-01-16, so failing tests should be checked for the earliest parent that is common to all of the test failures (probably landed within a day of the start of tests failing).&lt;/p&gt;

&lt;p&gt;I also wrote a small fixup to the sanity-quota.sh test script because it was spewing a lot of garbage into the logs: &lt;a href=&quot;http://review.whamcloud.com/8978&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8978&lt;/a&gt;  Note that this is NOT a fix to the problem reported here.&lt;/p&gt;</comment>
                            <comment id="75528" author="adilger" created="Thu, 23 Jan 2014 20:25:22 +0000"  >&lt;p&gt;I did some digging into the test failures, and the earliest failures were hit with parent commit 035f3e4bf7532839dd88a4ae330fd67542e17cdd (&lt;a href=&quot;http://review.whamcloud.com/8528&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8528&lt;/a&gt;) but I don&apos;t think that patch is the source of the problem.  Nothing similar was hit in the two weeks prior to this.&lt;/p&gt;</comment>
                            <comment id="75529" author="adilger" created="Thu, 23 Jan 2014 22:14:37 +0000"  >&lt;p&gt;I was looking at the debug logs for &lt;a href=&quot;https://maloo.whamcloud.com/test_sets/0c69b0d8-7e9d-11e3-b6d1-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/0c69b0d8-7e9d-11e3-b6d1-52540035b04c&lt;/a&gt; and it appears that the &quot;&lt;tt&gt;chown&lt;/tt&gt;&quot; RPC (&quot;&lt;tt&gt;MDS_REINT&lt;/tt&gt;&quot;) is sent to the MDS, but no matching &quot;&lt;tt&gt;OST_SETATTR&lt;/tt&gt;&quot; RPC is sent to the OST to change the object ownership.  I also see in the logs:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;1389835717.361895:0:4338:0:(osd_quota.c:98:osd_acct_index_lookup()) lustre-MDT0000: id ea60 not found in DMU accounting ZAP
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;which indicates to me (a non quota expert) that this user (0xea60=60000) doesn&apos;t have any files in quota accounting.&lt;/p&gt;</comment>
                            <comment id="75533" author="yong.fan" created="Fri, 24 Jan 2014 00:23:52 +0000"  >&lt;p&gt;Niu: I have submitted a patch (&lt;a href=&quot;http://review.whamcloud.com/#/c/8981/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/8981/&lt;/a&gt;) to disable sanity-quota &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4515&quot; title=&quot;Test failure sanity-quota test_34: Used space for user 60000 is 0, expected 2048&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4515&quot;&gt;&lt;del&gt;LU-4515&lt;/del&gt;&lt;/a&gt; to keep other patches from failing because of this bug. Please re-enable it when you submit a patch to fix the related issues. Thanks!&lt;/p&gt;</comment>
                            <comment id="75545" author="johann" created="Fri, 24 Jan 2014 09:30:16 +0000"  >&lt;p&gt;The lack of OST_SETATTR requests is weird. The test relies on wait_delete_completed to wait for setattr RPCs to be sent, is it possible that this function does not work any more for setattr?&lt;/p&gt;</comment>
                            <comment id="75546" author="bobijam" created="Fri, 24 Jan 2014 09:30:41 +0000"  >&lt;p&gt;In the client&apos;s ll_setattr_raw(), after it sets the attributes on the MDS, the client only sets OST attributes for size &amp;amp; time changes; it won&apos;t do anything about a uid change on the OST.&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;        &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (attr-&amp;gt;ia_valid &amp;amp; (ATTR_SIZE |
                              ATTR_ATIME | ATTR_ATIME_SET |
                              ATTR_MTIME | ATTR_MTIME_SET)) {
                /* For truncate and utimes sending attributes to OSTs, setting
                 * mtime/atime to the past will be performed under PW [0:EOF]
                 * extent lock (new_size:EOF &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; truncate).  It may seem
                 * excessive to send mtime/atime updates to OSTs when not
                 * setting times to past, but it is necessary due to possible
                 * time de-synchronization between MDT inode and OST objects */
                rc = ll_setattr_ost(inode, attr);
        }
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I verified this behavior on ldiskfs backend, and the test passed for ldiskfs backend. From what&apos;s been observed, it likely relates to the quota implementation with zfs backend.&lt;/p&gt;</comment>
                            <comment id="75547" author="johann" created="Fri, 24 Jan 2014 09:44:04 +0000"  >&lt;p&gt;Bobijam, since 2.4, this is the MDT which is responsible for sending the OST_SETATTR RPCs to change ownership of objects on the OSTs. This is done through OSP and that&apos;s why the test calls wait_delete_completed to wait for OSP to flush all pending requests.&lt;/p&gt;</comment>
                            <comment id="75567" author="bogl" created="Fri, 24 Jan 2014 17:48:34 +0000"  >&lt;p&gt;As Johann said the test depends on wait_delete_completed to operate correctly.  wait_delete_completed relies on lproc stats maintained in osp_sync.c.  I see &lt;a href=&quot;http://review.whamcloud.com/7158&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/7158&lt;/a&gt; landed that touches osp code just about the time these errors started up.  I don&apos;t see anything wrong in that mod, but it does make changes in the close neighborhood and the coincidence in time seems suspicious.&lt;/p&gt;</comment>
                            <comment id="75678" author="jlevi" created="Mon, 27 Jan 2014 15:19:10 +0000"  >&lt;p&gt;Test has been disabled. Will re-enable once fix is in place.&lt;/p&gt;</comment>
                            <comment id="75694" author="utopiabound" created="Mon, 27 Jan 2014 18:10:48 +0000"  >&lt;p&gt;Jodi, how has this test been disabled?  Could this be related to issues with TEI-1403?&lt;/p&gt;</comment>
                            <comment id="77327" author="niu" created="Wed, 19 Feb 2014 06:59:14 +0000"  >&lt;p&gt;I saw this on the mds log before s-q test_34:&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;Lustre: DEBUG MARKER: mkdir -p /mnt/mds1; mount -t lustre -o user_xattr,acl  		                   lustre-mdt1/mdt1 /mnt/mds1
------------[ cut here ]------------
WARNING: at fs/proc/&lt;span class=&quot;code-keyword&quot;&gt;generic&lt;/span&gt;.c:590 proc_register+0x129/0x220() (Tainted: P        W  ---------------   )
Hardware name: KVM
proc_dir_entry &lt;span class=&quot;code-quote&quot;&gt;&apos;lustre/osc&apos;&lt;/span&gt; already registered
Modules linked in: osp(U) mdd(U) lfsck(U) lod(U) mdt(U) mgs(U) mgc(U) nodemap(U) osd_zfs(U) lquota(U) lustre(U) lov(U) mdc(U) fid(U) fld(U) ksocklnd(U) ptlrpc(U) obdclass(U) lnet(U) sha512_generic sha256_generic libcfs(U) nfsd exportfs autofs4 nfs lockd fscache auth_rpcgss nfs_acl sunrpc ib_ipoib rdma_ucm ib_ucm ib_uverbs ib_umad rdma_cm ib_cm iw_cm ib_addr ipv6 ib_sa ib_mad ib_core zfs(P)(U) zcommon(P)(U) znvpair(P)(U) zavl(P)(U) zunicode(P)(U) spl(U) zlib_deflate microcode virtio_balloon 8139too 8139cp mii i2c_piix4 i2c_core ext3 jbd mbcache virtio_blk virtio_pci virtio_ring virtio pata_acpi ata_generic ata_piix dm_mirror dm_region_hash dm_log dm_mod [last unloaded: speedstep_lib]
Pid: 26088, comm: llog_process_th Tainted: P        W  ---------------    2.6.32-358.23.2.el6_lustre.ge80a1ca.x86_64 #1
Call Trace:
 [&amp;lt;ffffffff8106e3e7&amp;gt;] ? warn_slowpath_common+0x87/0xc0
 [&amp;lt;ffffffff8106e4d6&amp;gt;] ? warn_slowpath_fmt+0x46/0x50
 [&amp;lt;ffffffff811f0299&amp;gt;] ? proc_register+0x129/0x220
 [&amp;lt;ffffffff811f05c2&amp;gt;] ? proc_mkdir_mode+0x42/0x60
 [&amp;lt;ffffffff811f05f6&amp;gt;] ? proc_mkdir+0x16/0x20
 [&amp;lt;ffffffffa0718c00&amp;gt;] ? lprocfs_seq_register+0x20/0x80 [obdclass]
 [&amp;lt;ffffffffa070a203&amp;gt;] ? class_search_type+0x53/0xa0 [obdclass]
 [&amp;lt;ffffffffa1098f0a&amp;gt;] ? osp_lprocfs_init+0x30a/0x530 [osp]
 [&amp;lt;ffffffffa1085c3a&amp;gt;] ? osp_device_alloc+0xfaa/0x29e0 [osp]
 [&amp;lt;ffffffffa0746263&amp;gt;] ? lu_context_init+0xa3/0x240 [obdclass]
 [&amp;lt;ffffffffa072ce2f&amp;gt;] ? obd_setup+0x1bf/0x290 [obdclass]
 [&amp;lt;ffffffffa072d108&amp;gt;] ? class_setup+0x208/0x870 [obdclass]
 [&amp;lt;ffffffffa073567c&amp;gt;] ? class_process_config+0xc6c/0x1ad0 [obdclass]
 [&amp;lt;ffffffffa072e263&amp;gt;] ? lustre_cfg_new+0x2d3/0x6e0 [obdclass]
 [&amp;lt;ffffffffa07375fb&amp;gt;] ? class_config_llog_handler+0xa2b/0x1880 [obdclass]
 [&amp;lt;ffffffff8150faee&amp;gt;] ? mutex_lock+0x1e/0x50
 [&amp;lt;ffffffffa06f3d5b&amp;gt;] ? llog_process_thread+0x8ab/0xd60 [obdclass]
 [&amp;lt;ffffffffa0741e4f&amp;gt;] ? keys_fill+0x6f/0x190 [obdclass]
 [&amp;lt;ffffffffa06f4255&amp;gt;] ? llog_process_thread_daemonize+0x45/0x70 [obdclass]
 [&amp;lt;ffffffffa06f4210&amp;gt;] ? llog_process_thread_daemonize+0x0/0x70 [obdclass]
 [&amp;lt;ffffffff81096a36&amp;gt;] ? kthread+0x96/0xa0
 [&amp;lt;ffffffff8100c0ca&amp;gt;] ? child_rip+0xa/0x20
 [&amp;lt;ffffffff810969a0&amp;gt;] ? kthread+0x0/0xa0
 [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
---[ end trace f9bd04d09a084708 ]---
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;It looks like there is something wrong with the osp proc files, which stops wait_delete_completed() from working.&lt;/p&gt;

&lt;p&gt;This should be introduced by &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3319&quot; title=&quot;Adapt to 3.10 upstream kernel proc_dir_entry change&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3319&quot;&gt;&lt;del&gt;LU-3319&lt;/del&gt;&lt;/a&gt;. Given that the patch &quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3319&quot; title=&quot;Adapt to 3.10 upstream kernel proc_dir_entry change&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3319&quot;&gt;&lt;del&gt;LU-3319&lt;/del&gt;&lt;/a&gt; procfs: move osp proc handling to seq_files&quot; (which exactly caused this problem) has been reverted, I think we can add back test_34 now.&lt;/p&gt;</comment>
                            <comment id="77354" author="simmonsja" created="Wed, 19 Feb 2014 14:35:20 +0000"  >&lt;p&gt;The revert helped, but a module loading race condition still exists when both client and server are on the same node. A patch exists to fix that issue at &lt;a href=&quot;http://review.whamcloud.com/#/c/9038&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/9038&lt;/a&gt;.&lt;/p&gt;</comment>
                            <comment id="82418" author="adilger" created="Thu, 24 Apr 2014 17:43:36 +0000"  >&lt;p&gt;Niu, we still need a test to remove test_34 from sanity-quota.sh ALWAYS_EXCEPT.  Please just delete that ALWAYS_EXCEPT line, since these exceptions should be added at the top of the function where ALWAYS_EXCEPT is first defined.&lt;/p&gt;</comment>
                            <comment id="83521" author="jlevi" created="Thu, 8 May 2014 15:20:40 +0000"  >&lt;p&gt;Patch landed to Master. Please reopen ticket if more work is needed.&lt;/p&gt;</comment>
                            <comment id="88068" author="niu" created="Thu, 3 Jul 2014 04:35:35 +0000"  >&lt;p&gt; &lt;a href=&quot;http://review.whamcloud.com/10957&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/10957&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="88069" author="niu" created="Thu, 3 Jul 2014 04:36:28 +0000"  >&lt;p&gt;test_34 needs to be re-enabled.&lt;/p&gt;</comment>
                            <comment id="88209" author="adilger" created="Fri, 4 Jul 2014 18:21:41 +0000"  >&lt;p&gt;We can&apos;t enable sanity-quota test_34 until the test is fixed by &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-5296&quot; title=&quot;lod_attr_set() skips attr_set on osp objects incorrectly&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-5296&quot;&gt;&lt;del&gt;LU-5296&lt;/del&gt;&lt;/a&gt; patch &lt;a href=&quot;http://review.whamcloud.com/10989&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/10989&lt;/a&gt; &lt;/p&gt;</comment>
                            <comment id="88210" author="adilger" created="Fri, 4 Jul 2014 18:26:21 +0000"  >&lt;p&gt;Closing this bug again.  I&apos;ve moved the re-enabling of test_34 into &lt;a href=&quot;http://review.whamcloud.com/10989&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/10989&lt;/a&gt; so that this patch is being verified as fixed.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="25439">LU-5296</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="22811">LU-4511</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                                        </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzwd9j:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>12354</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>