<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:14:29 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-14988] crash in ll_migrate in racer</title>
                <link>https://jira.whamcloud.com/browse/LU-14988</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;&lt;a href=&quot;https://review.whamcloud.com/#/c/43964/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/43964/&lt;/a&gt; seems to cause a crash in ll_migrate similar to what was reported in now landed &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13157&quot; title=&quot;migrate symlink with target name length &amp;gt; 59 cause crash&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13157&quot;&gt;&lt;del&gt;LU-13157&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;very reproducible on recent master-next&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt; 
[ &#160;628.058780] LustreError: 25573:0:(ldlm_resource.c:1124:ldlm_resource_complain()) Skipped 23 previous similar messages
[ &#160;628.489874] LustreError: 14648:0:(osp_sync.c:1094:osp_sync_process_committed()) lustre-OST0003-osc-MDT0001: can&apos;t cancel 279 records: rc = -30
[ &#160;628.599298] LustreError: 14648:0:(osp_sync.c:1094:osp_sync_process_committed()) Skipped 15 previous similar messages
[ &#160;628.701810] Lustre: lustre-OST0000-osc-ffff88029a0e8008: Connection restored to 192.168.123.100@tcp (at 0@lo)
[ &#160;629.004000] LustreError: 14050:0:(osp_sync.c:1079:osp_sync_process_committed()) lustre-OST0001-osc-MDT0001: can&apos;t cancel record: rc = -30
[ &#160;629.035251] LustreError: 14050:0:(osp_sync.c:1079:osp_sync_process_committed()) Skipped 5 previous similar messages
[ &#160;630.287812] LustreError: 25548:0:(llite_lib.c:1836:ll_md_setattr()) md_setattr fails: rc = -30
[ &#160;630.894353] Lustre: mdt07_002: service thread pid 11113 was inactive for 66.027 seconds. Watchdog stack traces are limited to 3 per 300 seconds, skipping this one.
[ &#160;630.930762] Lustre: Skipped 6 previous similar messages
[ &#160;631.237306] LustreError: 11-0: lustre-MDT0001-mdc-ffff88009e7fb7e8: operation ldlm_enqueue to node 0@lo failed: rc = -30
[ &#160;631.396604] LustreError: 25697:0:(llite_lib.c:1836:ll_md_setattr()) md_setattr fails: rc = -30
[ &#160;631.768361] LustreError: 25697:0:(llite_lib.c:1836:ll_md_setattr()) Skipped 1 previous similar message
[ &#160;632.634314] BUG: unable to handle kernel NULL pointer dereference at 0000000000000008
[ &#160;632.658290] IP: [&amp;lt;ffffffffa1051e52&amp;gt;] ll_migrate+0x9b2/0xec0 [lustre]
[ &#160;632.660785] PGD 800000028b3a6067 PUD 28b3a7067 PMD 0 
[ &#160;632.662892] Oops: 0000 [#1] SMP DEBUG_PAGEALLOC
[ &#160;632.665067] Modules linked in: loop zfs(PO) zunicode(PO) zzstd(O) zlua(O) zcommon(PO) znvpair(PO) zavl(PO) icp(PO) spl(O) lustre(OE) ofd(OE) osp(OE) lod(OE) ost(OE) mdt(OE) mdd(OE) mgs(OE) osd_ldiskfs(OE) ldiskfs(OE) jbd2 mbcache lquota(OE) lfsck(OE) obdecho(OE) mgc(OE) mdc(OE) lov(OE) osc(OE) lmv(OE) fid(OE) fld(OE) ptlrpc_gss(OE) ptlrpc(OE) obdclass(OE) ksocklnd(OE) lnet(OE) dm_flakey dm_mod libcfs(OE) crc_t10dif crct10dif_generic sb_edac edac_core iosf_mbi crc32_pclmul ghash_clmulni_intel aesni_intel lrw gf128mul glue_helper ablk_helper cryptd virtio_balloon virtio_console pcspkr i2c_piix4 ip_tables rpcsec_gss_krb5 drm_kms_helper ttm ata_generic pata_acpi drm crct10dif_pclmul crct10dif_common crc32c_intel drm_panel_orientation_quirks ata_piix serio_raw virtio_blk i2c_core libata floppy
[ &#160;632.698829] CPU: 6 PID: 25076 Comm: lfs Kdump: loaded Tainted: P &#160;&#160;&#160;&#160;&#160;&#160;&#160;W &#160;OE &#160;------------ &#160;&#160;3.10.0-7.9-debug #2
[ &#160;632.701212] Hardware name: Red Hat KVM, BIOS 0.5.1 01/01/2011
[ &#160;632.702454] task: ffff8802912324f0 ti: ffff88024ad2c000 task.ti: ffff88024ad2c000
[ &#160;632.705158] RIP: 0010:[&amp;lt;ffffffffa1051e52&amp;gt;] &#160;[&amp;lt;ffffffffa1051e52&amp;gt;] ll_migrate+0x9b2/0xec0 [lustre]
[ &#160;632.708792] RSP: 0018:ffff88024ad2fbc8 &#160;EFLAGS: 00010206
[ &#160;632.710770] RAX: 0000000000000000 RBX: ffff880253c01458 RCX: 0000000000000000
[ &#160;632.713070] RDX: 0000000000000000 RSI: ffff880327331138 RDI: ffff880327331118
[ &#160;632.715401] RBP: ffff88024ad2fc48 R08: ffff8802668e2058 R09: 0000000000000001
[ &#160;632.717769] R10: 0000000000000000 R11: ffff88024ad2f5e6 R12: 0000000000000000
[ &#160;632.720049] R13: ffff8800848d48e8 R14: ffff88029b7166d8 R15: 0000000000000030
[ &#160;632.722352] FS: &#160;00007fa279316740(0000) GS:ffff880331b80000(0000) knlGS:0000000000000000
[ &#160;632.781764] CS: &#160;0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[ &#160;632.784011] CR2: 0000000000000008 CR3: 0000000266662000 CR4: 00000000001607e0
[ &#160;632.786316] Call Trace:
[ &#160;632.788315] &#160;[&amp;lt;ffffffff81242213&amp;gt;] ? __check_object_size+0x1c3/0x220
[ &#160;632.790913] &#160;[&amp;lt;ffffffffa103f561&amp;gt;] ll_dir_ioctl+0x5d01/0x6ed0 [lustre]
[ &#160;632.793261] &#160;[&amp;lt;ffffffff81411979&amp;gt;] ? do_raw_spin_unlock+0x49/0x90
[ &#160;632.795476] &#160;[&amp;lt;ffffffff8115260f&amp;gt;] ? delayacct_end+0x8f/0xb0
[ &#160;632.817827] &#160;[&amp;lt;ffffffff81152744&amp;gt;] ? __delayacct_blkio_end+0x34/0x60
[ &#160;632.820259] &#160;[&amp;lt;ffffffff817e0257&amp;gt;] ? io_schedule_timeout+0xe7/0x130
[ &#160;632.822620] &#160;[&amp;lt;ffffffff811b62dd&amp;gt;] ? find_get_pages_tag+0x10d/0x260
[ &#160;632.824759] &#160;[&amp;lt;ffffffff811c3691&amp;gt;] ? pagevec_lookup_tag+0x21/0x30
[ &#160;632.827037] &#160;[&amp;lt;ffffffff811b400e&amp;gt;] ? __filemap_fdatawait_range+0xbe/0x1a0
[ &#160;632.830403] &#160;[&amp;lt;ffffffff8125b3fd&amp;gt;] do_vfs_ioctl+0x40d/0x6c0
[ &#160;632.833084] &#160;[&amp;lt;ffffffff81264d2b&amp;gt;] ? iput+0x3b/0x180
[ &#160;632.835354] &#160;[&amp;lt;ffffffff8125b751&amp;gt;] SyS_ioctl+0xa1/0xc0
[ &#160;632.838391] &#160;[&amp;lt;ffffffff817ee00c&amp;gt;] system_call_fastpath+0x1f/0x24
[ &#160;632.840775] Code: 03 49 89 45 50 48 8b 44 24 38 49 89 85 38 01 00 00 48 8b 43 20 41 81 8d 30 01 00 00 00 20 00 00 49 89 85 40 01 00 00 48 8b 43 18 &amp;lt;48&amp;gt; 8b 78 08 48 83 c7 18 e8 b1 13 79 e0 48 8b 43 18 48 8b 40 08
[ &#160;632.884740] RIP &#160;[&amp;lt;ffffffffa1051e52&amp;gt;] ll_migrate+0x9b2/0xec0 [lustre]
[ &#160;632.891978] &#160;RSP &amp;lt;ffff88024ad2fbc8&amp;gt;
[ &#160;632.912110] CR2: 0000000000000008&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="65953">LU-14988</key>
            <summary>crash in ll_migrate in racer</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="green">Oleg Drokin</reporter>
                        <labels>
                    </labels>
                <created>Tue, 7 Sep 2021 10:04:36 +0000</created>
                <updated>Tue, 29 Aug 2023 22:54:20 +0000</updated>
                                            <version>Lustre 2.15.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="313418" author="gerrit" created="Mon, 20 Sep 2021 16:10:29 +0000"  >&lt;p&gt;&lt;del&gt;&quot;James Nunez &amp;lt;jnunez@whamcloud.com&amp;gt;&quot; uploaded a new patch:&lt;/del&gt; &lt;a href=&quot;https://review.whamcloud.com/44992&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/44992&lt;/a&gt;&lt;br/&gt;
&lt;del&gt;Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14988&quot; title=&quot;crash in ll_migrate in racer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14988&quot;&gt;LU-14988&lt;/a&gt; tests: racer overstripe crash&lt;/del&gt;&lt;br/&gt;
&lt;del&gt;Project: fs/lustre-release&lt;/del&gt;&lt;br/&gt;
&lt;del&gt;Branch: master&lt;/del&gt;&lt;br/&gt;
&lt;del&gt;Current Patch Set: 1&lt;/del&gt;&lt;br/&gt;
&lt;del&gt;Commit: 720a1c5dfa58236b7c3ca8f57c6f7d4862d16284&lt;/del&gt;&lt;/p&gt;</comment>
                            <comment id="315323" author="spitzcor" created="Tue, 12 Oct 2021 17:46:28 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=jamesanunez&quot; class=&quot;user-hover&quot; rel=&quot;jamesanunez&quot;&gt;jamesanunez&lt;/a&gt;, what&apos;s going on with &lt;a href=&quot;https://review.whamcloud.com/#/c/44992/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/44992/&lt;/a&gt; ?  Any news?  I think &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14754&quot; title=&quot;add Overstripe support to racer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14754&quot;&gt;&lt;del&gt;LU-14754&lt;/del&gt;&lt;/a&gt; has been waiting on this to shake out, but there is nothing wrong with that test patch.  If that test is bringing out this issue it is all the more reason to land it, don&apos;t you think?&lt;/p&gt;</comment>
                            <comment id="315361" author="adilger" created="Wed, 13 Oct 2021 01:26:34 +0000"  >&lt;p&gt;Cory,&lt;br/&gt;
it&apos;s true that the new test has brought out this new issue, and there is nothing particularly &quot;wrong&quot; with the patch itself, but I disagree that this implies the patch should land immediately.  If that were to happen, then all or many racer test runs would trigger this same assertion, and we&apos;d be flooded with a sea of test failures, potentially hiding other regressions that may be introduced in the meantime because it is hard to distinguish the existing &quot;FAIL&quot; or &quot;TIMEOUT&quot; from some new &quot;FAIL&quot;, even if the root causes are different. &lt;/p&gt;

&lt;p&gt;Rather than landing the new test patch as-is, the new defect that the new test patch found needs to be fixed, verify that the new test is now passing, and then land both of them.&lt;/p&gt;</comment>
                            <comment id="315698" author="egryaznova" created="Fri, 15 Oct 2021 14:38:11 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=adilger&quot; class=&quot;user-hover&quot; rel=&quot;adilger&quot;&gt;adilger&lt;/a&gt;,&lt;br/&gt;
will the following change help to land the patch ?&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
--- a/lustre/tests/racer.sh
+++ b/lustre/tests/racer.sh
@@ -70,7 +70,8 @@ RACER_ENABLE_PFL=${RACER_ENABLE_PFL:-&lt;span class=&quot;code-keyword&quot;&gt;true&lt;/span&gt;}
 RACER_ENABLE_DOM=${RACER_ENABLE_DOM:-&lt;span class=&quot;code-keyword&quot;&gt;true&lt;/span&gt;}
 RACER_ENABLE_FLR=${RACER_ENABLE_FLR:-&lt;span class=&quot;code-keyword&quot;&gt;true&lt;/span&gt;}
 RACER_ENABLE_SEL=${RACER_ENABLE_SEL:-&lt;span class=&quot;code-keyword&quot;&gt;true&lt;/span&gt;}
-RACER_ENABLE_OVERSTRIPE=${RACER_ENABLE_OVERSTRIPE:-&lt;span class=&quot;code-keyword&quot;&gt;true&lt;/span&gt;}
+# set &lt;span class=&quot;code-keyword&quot;&gt;false&lt;/span&gt;, LU-14988
+RACER_ENABLE_OVERSTRIPE=${RACER_ENABLE_OVERSTRIPE:-&lt;span class=&quot;code-keyword&quot;&gt;false&lt;/span&gt;}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="315769" author="adilger" created="Sat, 16 Oct 2021 06:24:06 +0000"  >&lt;p&gt;Definitely yes. That will allow the functionality to be landed, without it being enabled. &lt;/p&gt;</comment>
                            <comment id="315770" author="egryaznova" created="Sat, 16 Oct 2021 06:49:41 +0000"  >&lt;p&gt;Thank you, Andreas.&lt;br/&gt;
Patch is updated.&lt;/p&gt;</comment>
                            <comment id="369552" author="adilger" created="Fri, 14 Apr 2023 22:49:02 +0000"  >&lt;p&gt;The next step for this issue would be to push a patch that changes:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;-RACER_ENABLE_OVERSTRIPE=${RACER_ENABLE_OVERSTRIPE:-false}
+RACER_ENABLE_OVERSTRIPE=${RACER_ENABLE_OVERSTRIPE:-true}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;and then add enough &quot;&lt;tt&gt;Test-Parameters: testlist=racer env=DURATION=900&lt;/tt&gt;&quot; runs to determine if the overstriping is still causing new failures or not.  In the past 4 weeks on master there have been 479 racer runs, with 4 FAIL, 8 CRASH, 1 TIMEOUT:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.whamcloud.com/search?client_branch_type_id=24a6947e-04a9-11e1-bb5f-52540025f9af&amp;amp;server_branch_type_id=24a6947e-04a9-11e1-bb5f-52540025f9af&amp;amp;horizon=2332800&amp;amp;status%5B%5D=FAIL&amp;amp;status%5B%5D=TIMEOUT&amp;amp;status%5B%5D=CRASH&amp;amp;test_set_script_id=9ab2e9f8-6aec-11e0-b32b-52540025f9af&amp;amp;sub_test_script_id=12c874f8-c308-11e0-9a20-52540025f9af&amp;amp;source=sub_tests#redirect&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/search?client_branch_type_id=24a6947e-04a9-11e1-bb5f-52540025f9af&amp;amp;server_branch_type_id=24a6947e-04a9-11e1-bb5f-52540025f9af&amp;amp;horizon=2332800&amp;amp;status%5B%5D=FAIL&amp;amp;status%5B%5D=TIMEOUT&amp;amp;status%5B%5D=CRASH&amp;amp;test_set_script_id=9ab2e9f8-6aec-11e0-b32b-52540025f9af&amp;amp;sub_test_script_id=12c874f8-c308-11e0-9a20-52540025f9af&amp;amp;source=sub_tests#redirect&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;So that is about 1/37 ~= 2.7% failure rate, so running a handful of &lt;tt&gt;racer&lt;/tt&gt; runs would tell us first if this crash is still present/common, and then about 100 total runs would tell us if this induces more failures, or if it can be re-enabled by default (presumably bug has since been fixed).&lt;/p&gt;</comment>
                            <comment id="384135" author="gerrit" created="Tue, 29 Aug 2023 22:53:42 +0000"  >&lt;p&gt;&quot;Andreas Dilger &amp;lt;adilger@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/52169&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/52169&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14988&quot; title=&quot;crash in ll_migrate in racer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14988&quot;&gt;LU-14988&lt;/a&gt; tests: enable overstripe in racer&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: c9069855175d5807f63db93ada1ecd5760722b39&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="57839">LU-13157</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="77562">LU-17048</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="64619">LU-14754</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i023nj:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>