<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:32:11 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-17048] Crash in lod_declare_update_extents</title>
                <link>https://jira.whamcloud.com/browse/LU-17048</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;After additional testing was added to racer for migration and mirroring (not sure exactly which is the culprit here), patches: &lt;a href=&quot;https://review.whamcloud.com/13669&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/13669&lt;/a&gt; and &lt;a href=&quot;https://review.whamcloud.com/41368&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/41368&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;a frequent crash cropped up:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt; [ 6876.856207] BUG: unable to handle kernel NULL pointer dereference at 0000000000000006
[ 6876.857009] IP: [&amp;lt;ffffffffa0f50aa6&amp;gt;] lod_declare_update_extents.isra.57+0x86/0x1910 [lod]
[ 6876.857009] PGD 2aab7d067 PUD 322652067 PMD 0 
[ 6876.857009] Oops: 0000 [#1] SMP DEBUG_PAGEALLOC
[ 6876.857009] Modules linked in: lustre(OE) ofd(OE) osp(OE) lod(OE) ost(OE) mdt(OE) mdd(OE) mgs(OE) osd_ldiskfs(OE) ldiskfs(OE) lquota(OE) lfsck(OE) obdecho(OE) mgc(OE) mdc(OE) lov(OE) osc(OE) lmv(OE) fid(OE) fld(OE) ptlrpc_gss(OE) ptlrpc(OE) obdclass(OE) ksocklnd(OE) lnet(OE) dm_flakey dm_mod libcfs(OE) loop zfs(PO) zunicode(PO) zlua(PO) zcommon(PO) znvpair(PO) zavl(PO) icp(PO) spl(O) jbd2 mbcache crc32_generic crc_t10dif crct10dif_generic crct10dif_common virtio_console virtio_balloon pcspkr i2c_piix4 ip_tables rpcsec_gss_krb5 ata_generic pata_acpi drm_kms_helper ttm drm ata_piix drm_panel_orientation_quirks serio_raw virtio_blk libata i2c_core floppy [last unloaded: libcfs]
[ 6876.866880] CPU: 11 PID: 5226 Comm: mdt05_000 Kdump: loaded Tainted: P           OE  ------------   3.10.0-7.9-debug #2
[ 6876.866880] Hardware name: Red Hat KVM, BIOS 1.16.0-3.module_el8.7.0+1218+f626c2ff 04/01/2014
[ 6876.866880] task: ffff8800a5780010 ti: ffff88028bde8000 task.ti: ffff88028bde8000
[ 6876.866880] RIP: 0010:[&amp;lt;ffffffffa0f50aa6&amp;gt;]  [&amp;lt;ffffffffa0f50aa6&amp;gt;] lod_declare_update_extents.isra.57+0x86/0x1910 [lod]
[ 6876.866880] RSP: 0018:ffff88028bdeb738  EFLAGS: 00010246
[ 6876.866880] RAX: 0000000000000000 RBX: ffff8802a92d9b40 RCX: ffff8802a28d6378
[ 6876.866880] RDX: ffff880079bc3ef8 RSI: ffffffffa0f812e0 RDI: ffff880323d607d8
[ 6876.866880] RBP: ffff88028bdeb830 R08: 0000000000000000 R09: 0000000000000000
[ 6876.866880] R10: 0000000000000000 R11: 0000000000000000 R12: ffff88026c882e98
[ 6876.866880] R13: ffff8800a29c0ff8 R14: ffff880323d607d8 R15: ffff8802a92d9b40
[ 6876.866880] FS:  0000000000000000(0000) GS:ffff880331cc0000(0000) knlGS:0000000000000000
[ 6876.866880] CS:  0010 DS: 0000 ES: 0000 CR0: 000000008005003b
[ 6876.866880] CR2: 0000000000000006 CR3: 00000002ad280000 CR4: 00000000000007e0
[ 6876.866880] Call Trace:
[ 6876.882318]  [&amp;lt;ffffffffa0c0a1d0&amp;gt;] ? osd_trans_create+0xa0/0x690 [osd_ldiskfs]
[ 6876.882318]  [&amp;lt;ffffffffa03ecf88&amp;gt;] ? lu_buf_alloc+0x58/0x320 [obdclass]
[ 6876.882318]  [&amp;lt;ffffffffa0c0a1d0&amp;gt;] ? osd_trans_create+0xa0/0x690 [osd_ldiskfs]
[ 6876.882318]  [&amp;lt;ffffffffa0f34098&amp;gt;] ? lod_striping_load+0x98/0x6c0 [lod]
[ 6876.884562]  [&amp;lt;ffffffffa0f592aa&amp;gt;] lod_declare_update_plain+0x56a/0x980 [lod]
[ 6876.884562]  [&amp;lt;ffffffff8122054f&amp;gt;] ? __kmalloc+0x1ef/0x370
[ 6876.884562]  [&amp;lt;ffffffffa0f5b83e&amp;gt;] lod_declare_layout_change+0x69e/0xba0 [lod]
[ 6876.884562]  [&amp;lt;ffffffffa03ecfa1&amp;gt;] ? lu_buf_alloc+0x71/0x320 [obdclass]
[ 6876.884562]  [&amp;lt;ffffffffa0dd339b&amp;gt;] mdd_declare_layout_change+0x4b/0x100 [mdd]
[ 6876.884562]  [&amp;lt;ffffffffa0dde491&amp;gt;] mdd_layout_change+0xd91/0x1bc0 [mdd]
[ 6876.884562]  [&amp;lt;ffffffffa0e3db3f&amp;gt;] mdt_layout_change+0x2bf/0x450 [mdt]
[ 6876.884562]  [&amp;lt;ffffffffa0e444f0&amp;gt;] mdt_intent_layout+0x910/0xeb0 [mdt]
[ 6876.884562]  [&amp;lt;ffffffffa0e3b4fc&amp;gt;] mdt_intent_opc+0x1dc/0xc40 [mdt]
[ 6876.884562]  [&amp;lt;ffffffffa0e43be0&amp;gt;] ? mdt_intent_open+0x480/0x480 [mdt]
[ 6876.884562]  [&amp;lt;ffffffffa0e4134a&amp;gt;] mdt_intent_policy+0xfa/0x460 [mdt]
[ 6876.884562]  [&amp;lt;ffffffffa06941b1&amp;gt;] ldlm_lock_enqueue+0x3b1/0xbb0 [ptlrpc]
[ 6876.884562]  [&amp;lt;ffffffffa01c0f05&amp;gt;] ? cfs_hash_rw_unlock+0x15/0x20 [libcfs]
[ 6876.884562]  [&amp;lt;ffffffffa01c4186&amp;gt;] ? cfs_hash_add+0xa6/0x180 [libcfs]
[ 6876.884562]  [&amp;lt;ffffffffa06bc4e5&amp;gt;] ldlm_handle_enqueue+0x375/0x17d0 [ptlrpc]
[ 6876.884562]  [&amp;lt;ffffffffa063ca00&amp;gt;] ? lustre_msg_buf_v2+0x1e0/0x1f0 [ptlrpc]
[ 6876.884562]  [&amp;lt;ffffffffa06fe958&amp;gt;] tgt_enqueue+0x68/0x240 [ptlrpc]
[ 6876.894516]  [&amp;lt;ffffffffa0708f8e&amp;gt;] tgt_request_handle+0x88e/0x19b0 [ptlrpc]
[ 6876.894784]  [&amp;lt;ffffffffa064ebb1&amp;gt;] ptlrpc_server_handle_request+0x251/0xc00 [ptlrpc]
[ 6876.894784]  [&amp;lt;ffffffffa06508c6&amp;gt;] ptlrpc_main+0xc66/0x1670 [ptlrpc]
[ 6876.894784]  [&amp;lt;ffffffff810dbb51&amp;gt;] ? put_prev_entity+0x31/0x400
[ 6876.894784]  [&amp;lt;ffffffff814119f9&amp;gt;] ? do_raw_spin_unlock+0x49/0x90
[ 6876.894784]  [&amp;lt;ffffffffa064fc60&amp;gt;] ? ptlrpc_wait_event+0x620/0x620 [ptlrpc]
[ 6876.894784]  [&amp;lt;ffffffff810ba114&amp;gt;] kthread+0xe4/0xf0
[ 6876.894784]  [&amp;lt;ffffffff810ba030&amp;gt;] ? kthread_create_on_node+0x140/0x140
[ 6876.894784]  [&amp;lt;ffffffff817ede5d&amp;gt;] ret_from_fork_nospec_begin+0x7/0x21
[ 6876.894784]  [&amp;lt;ffffffff810ba030&amp;gt;] ? kthread_create_on_node+0x140/0x140
[ 6876.894784] Code: 28 ff 01 74 0d f6 05 c5 2a 28 ff 04 0f 85 92 07 00 00 48 63 45 b8 48 8d 04 80 48 01 c0 48 89 85 68 ff ff ff 49 03 87 98 00 00 00 &amp;lt;0f&amp;gt; b7 58 06 0f b7 40 08 83 c0 01 41 f6 87 a0 00 00 00 1e 44 0f 
[ 6876.901347] RIP  [&amp;lt;ffffffffa0f50aa6&amp;gt;] lod_declare_update_extents.isra.57+0x86/0x1910 [lod]
[ 6876.901347]  RSP &amp;lt;ffff88028bdeb738&amp;gt;
[ 6876.901347] CR2: 0000000000000006&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;Here are crashes with crashdumps:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;http://testing.linuxhacker.ru/lustre-reports/external/crashes/boilpot-bigmem-100-2023-08-20-07:06:56/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://testing.linuxhacker.ru/lustre-reports/external/crashes/boilpot-bigmem-100-2023-08-20-07:06:56/&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;http://testing.linuxhacker.ru/lustre-reports/external/crashes/boilpot-bigmem-115-2023-08-21-05:51:53/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://testing.linuxhacker.ru/lustre-reports/external/crashes/boilpot-bigmem-115-2023-08-21-05:51:53/&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;http://testing.linuxhacker.ru/lustre-reports/external/crashes/boilpot-bigmem-105-2023-08-22-03:00:09/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://testing.linuxhacker.ru/lustre-reports/external/crashes/boilpot-bigmem-105-2023-08-22-03:00:09/&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;http://testing.linuxhacker.ru/lustre-reports/external/crashes/boilpot-bigmem-50-2023-08-22-10:12:59/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://testing.linuxhacker.ru/lustre-reports/external/crashes/boilpot-bigmem-50-2023-08-22-10:12:59/&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</description>
                <environment></environment>
        <key id="77562">LU-17048</key>
            <summary>Crash in lod_declare_update_extents</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="bobijam">Zhenyu Xu</assignee>
                                    <reporter username="green">Oleg Drokin</reporter>
                        <labels>
                    </labels>
                <created>Wed, 23 Aug 2023 04:45:12 +0000</created>
                <updated>Fri, 26 Jan 2024 20:30:26 +0000</updated>
                            <resolved>Wed, 20 Dec 2023 02:29:15 +0000</resolved>
                                    <version>Lustre 2.16.0</version>
                                    <fixVersion>Lustre 2.16.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>8</watches>
                                                                            <comments>
                            <comment id="383443" author="pjones" created="Wed, 23 Aug 2023 17:24:06 +0000"  >&lt;p&gt;Bobijam&lt;/p&gt;

&lt;p&gt;Could you please investigate this as a priority?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="384013" author="gerrit" created="Tue, 29 Aug 2023 03:51:52 +0000"  >&lt;p&gt;&quot;Zhenyu Xu &amp;lt;bobijam@hotmail.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/52146&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/52146&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-17048&quot; title=&quot;Crash in lod_declare_update_extents&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-17048&quot;&gt;&lt;del&gt;LU-17048&lt;/del&gt;&lt;/a&gt; mdd: protect layout in MDD layer&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 91c9ce720b5a81774f3ce5e7a3c25e7bb64d0853&lt;/p&gt;</comment>
                            <comment id="384131" author="adilger" created="Tue, 29 Aug 2023 22:24:29 +0000"  >&lt;p&gt;It looks like patch &lt;a href=&quot;https://review.whamcloud.com/43366&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/43366&lt;/a&gt; &quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14621&quot; title=&quot;Broken lock-transaction ordering in MDS code&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14621&quot;&gt;&lt;del&gt;LU-14621&lt;/del&gt;&lt;/a&gt; mdd: fix lock-tx order in mdd_xattr_merge()&lt;/tt&gt;&quot; (landed in v2_14_53-2-gb7bd4e3422) moved the mdd_write_lock() calls that covered the layouts during layout swap down to after &lt;tt&gt;mdd_trans_start()&lt;/tt&gt; to avoid a lock ordering deadlock, but it looks like that opened up the race condition for changing the layout here.&lt;/p&gt;</comment>
                            <comment id="384636" author="JIRAUSER17900" created="Sat, 2 Sep 2023 01:43:17 +0000"  >&lt;p&gt;2023-09-02: The fix patch is being worked on.&lt;/p&gt;</comment>
                            <comment id="394160" author="JIRAUSER17900" created="Fri, 24 Nov 2023 10:21:32 +0000"  >&lt;p&gt;2023-11-24: The fix patch is being reviewed.&lt;/p&gt;</comment>
                            <comment id="396142" author="JIRAUSER17900" created="Sat, 9 Dec 2023 04:49:16 +0000"  >&lt;p&gt;2023-12-16: The fix patch is ready to land on master (on master-next branch).&lt;/p&gt;</comment>
                            <comment id="397526" author="gerrit" created="Wed, 20 Dec 2023 01:43:47 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/52146/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/52146/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-17048&quot; title=&quot;Crash in lod_declare_update_extents&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-17048&quot;&gt;&lt;del&gt;LU-17048&lt;/del&gt;&lt;/a&gt; mdd: protect layout change in MDD layer&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: d5ab62af24166529b84b4d7227b96d3a69989a95&lt;/p&gt;</comment>
                            <comment id="397559" author="pjones" created="Wed, 20 Dec 2023 02:29:15 +0000"  >&lt;p&gt;Landed for 2.16&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="63839">LU-14621</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="65953">LU-14988</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i03tnr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>