<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:32:56 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-10198] GPF llog_osd_declare_write_rec+0xb6/0x3d0 </title>
                <link>https://jira.whamcloud.com/browse/LU-10198</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[ 1890.299266] LustreError: 19229:0:(mdd_device.c:263:llog_changelog_cancel()) lustre-MDD0000: cancel idx 23 of catalog [0x5:0xa:0x0]: rc = -2
[ 1890.291625] Modules linked in: loop lustre(OE) ofd(OE) osp(OE) lod(OE) ost(OE) mdt(OE) mdd(OE) mgs(OE) osd_ldiskfs(OE) ldiskfs(OE) mbcache lquota(OE) lfsck(OE) jbd2 obdecho(OE) mgc(OE) lov(OE) osc(OE) mdc(OE) lmv(OE) fid(OE) fld(OE) ptlrpc(OE) obdclass(OE) ksocklnd(OE) lnet(OE) libcfs(OE) ip6t_rpfilter ipt_REJECT nf_reject_ipv4 ip6t_REJECT nf_reject_ipv6 xt_conntrack ip_set nfnetlink ebtable_nat ebtable_broute bridge stp llc ip6table_nat nf_conntrack_ipv6 nf_defrag_ipv6 nf_nat_ipv6 ip6table_mangle ip6table_security ip6table_raw iptable_nat nf_conntrack_ipv4 nf_defrag_ipv4 nf_nat_ipv4 nf_nat nf_conntrack iptable_mangle iptable_security iptable_raw ebtable_filter ebtables ip6table_filter ip6_tables iptable_filter vboxsf(OE) snd_intel8x0 snd_ac97_codec ac97_bus snd_seq snd_seq_device snd_pcm iosf_mbi
[ 1890.308621]  crc32_pclmul ghash_clmulni_intel aesni_intel lrw gf128mul glue_helper snd_timer ppdev pcspkr snd ablk_helper soundcore cryptd virtio_net sg vboxvideo(OE) vboxguest(OE) ttm drm_kms_helper syscopyarea sysfillrect sysimgblt fb_sys_fops video drm i2c_piix4 parport_pc parport i2c_core nfsd auth_rpcgss nfs_acl lockd grace sunrpc ip_tables xfs libcrc32c sd_mod crc_t10dif crct10dif_generic sr_mod cdrom ata_generic pata_acpi ahci libahci e1000 ata_piix crct10dif_pclmul crct10dif_common crc32c_intel libata serio_raw virtio_pci virtio_ring virtio dm_mirror dm_region_hash dm_log dm_mod
[ 1890.317566] CPU: 3 PID: 19257 Comm: lctl Tainted: G           OE  ------------   3.10.0-693.2.2.el7_lustre.x86_64 #1
[ 1890.320750] Hardware name: innotek GmbH VirtualBox/VirtualBox, BIOS VirtualBox 12/01/2006
[ 1890.322062] task: ffff88007beddee0 ti: ffff880075950000 task.ti: ffff880075950000
[ 1890.323310] RIP: 0010:[&amp;lt;ffffffffc07ba9b6&amp;gt;]  [&amp;lt;ffffffffc07ba9b6&amp;gt;] llog_osd_declare_write_rec+0xb6/0x3d0 [obdclass]
[ 1890.325834] RSP: 0018:ffff8800759537a8  EFLAGS: 00010206
[ 1890.327262] RAX: 5a5a5a5a5a5a5a5a RBX: ffff880067977000 RCX: 0000000000000000
[ 1890.328622] RDX: 0000000000000000 RSI: 0000000000000000 RDI: ffff88007a9b2580
[ 1890.329976] RBP: ffff8800759537d8 R08: 0000000000000001 R09: 000000000000ffef
[ 1890.331375] R10: 0000000000002000 R11: 000000000000000f R12: ffff880075953d88
[ 1890.332884] R13: ffff880067d70840 R14: ffff880067977078 R15: ffff8800671e1c00
[ 1890.334374] FS:  00007f173df09740(0000) GS:ffff88007fd80000(0000) knlGS:0000000000000000
[ 1890.336313] CS:  0010 DS: 0000 ES: 0000 CR0: 000000008005003b
[ 1890.338548] CR2: 00007fbcc671ae40 CR3: 000000006c198000 CR4: 00000000000406e0
[ 1890.339733] DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
[ 1890.340838] DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400
[ 1890.341975] Stack:
[ 1890.343053]  ffff8800000029b9 ffff8800671e1200 ffffffffc1057100 ffff880075953d88
[ 1890.344121]  ffff88006a054000 00000000000029b9 ffff880075953818 ffffffffc07af174
[ 1890.345200]  ffff880067d70840 ffff8800671e1200 ffff880067d70840 ffff880075953d88
[ 1890.346339] Call Trace:
[ 1890.347426]  [&amp;lt;ffffffffc07af174&amp;gt;] llog_declare_write_rec+0x84/0x200 [obdclass]
[ 1890.348452]  [&amp;lt;ffffffffc07af8f2&amp;gt;] llog_cancel_rec+0xe2/0x870 [obdclass]
[ 1890.349732]  [&amp;lt;ffffffffc07b66fa&amp;gt;] llog_cat_cancel_records+0x13a/0x2e0 [obdclass]
[ 1890.350742]  [&amp;lt;ffffffffc0662c47&amp;gt;] ? libcfs_debug_msg+0x57/0x80 [libcfs]
[ 1890.351750]  [&amp;lt;ffffffffc10143d4&amp;gt;] llog_changelog_cancel_cb+0xe4/0x1d0 [mdd]
[ 1890.353074]  [&amp;lt;ffffffffc07b08f5&amp;gt;] llog_process_thread+0x875/0x1460 [obdclass]
[ 1890.354407]  [&amp;lt;ffffffffc10142f0&amp;gt;] ? mdd_device_free+0x2a0/0x2a0 [mdd]
[ 1890.355508]  [&amp;lt;ffffffffc07b159c&amp;gt;] llog_process_or_fork+0xbc/0x450 [obdclass]
[ 1890.356457]  [&amp;lt;ffffffffc07b6ad9&amp;gt;] llog_cat_process_cb+0x239/0x250 [obdclass]
[ 1890.357413]  [&amp;lt;ffffffffc07b08f5&amp;gt;] llog_process_thread+0x875/0x1460 [obdclass]
[ 1890.358301]  [&amp;lt;ffffffffc07b68a0&amp;gt;] ? llog_cat_cancel_records+0x2e0/0x2e0 [obdclass]
[ 1890.359194]  [&amp;lt;ffffffffc07b159c&amp;gt;] llog_process_or_fork+0xbc/0x450 [obdclass]
[ 1890.360036]  [&amp;lt;ffffffffc07b68a0&amp;gt;] ? llog_cat_cancel_records+0x2e0/0x2e0 [obdclass]
[ 1890.360885]  [&amp;lt;ffffffffc07b5e69&amp;gt;] llog_cat_process_or_fork+0x199/0x2a0 [obdclass]
[ 1890.361731]  [&amp;lt;ffffffffc10142f0&amp;gt;] ? mdd_device_free+0x2a0/0x2a0 [mdd]
[ 1890.362529]  [&amp;lt;ffffffffc10142f0&amp;gt;] ? mdd_device_free+0x2a0/0x2a0 [mdd]
[ 1890.363344]  [&amp;lt;ffffffffc07b5f9e&amp;gt;] llog_cat_process+0x2e/0x30 [obdclass]
....

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;I can reproduce this using this test &lt;a href=&quot;https://review.whamcloud.com/#/c/29035/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/29035/&lt;/a&gt; in loop mode.&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;   10986:       4d 8b 7e 70             mov    0x70(%r14),%r15
   1098a:       4d 85 ff                test   %r15,%r15
   1098d:       0f 84 9c 02 00 00       je     10c2f &amp;lt;llog_osd_declare_write_rec+0x32f&amp;gt;
   10993:       44 89 d0                mov    %r10d,%eax
   10996:       48 c7 43 78 00 00 00    movq   $0x0,0x78(%rbx)
   1099d:       00
   1099e:       4c 8d 73 78             lea    0x78(%rbx),%r14
   109a2:       48 89 83 80 00 00 00    mov    %rax,0x80(%rbx)
   109a9:       49 8b 47 30             mov    0x30(%r15),%rax
   109ad:       48 85 c0                test   %rax,%rax
   109b0:       0f 84 7a 01 00 00       je     10b30 &amp;lt;llog_osd_declare_write_rec+0x230&amp;gt;
   109b6:       48 8b 40 08             mov    0x8(%rax),%rax


&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;I have done a quick analysis: the fault happened when accessing&lt;br/&gt;
 llog_handle-&amp;gt;dt_object-&amp;gt;do_body_ops&lt;br/&gt;
 which contains poison (rax) 0x5a5a5a5a5a..&lt;br/&gt;
 It is great that dt_declare_record_write checks for a NULL pointer&lt;br/&gt;
 LASSERT(dt-&amp;gt;do_body_ops);&lt;br/&gt;
 Maybe a poison check is required here as well? It would simplify analysis of future failures.&#160;&lt;/p&gt;</description>
                <environment>top of master&lt;br/&gt;
git log --oneline -n3&lt;br/&gt;
97fe841 &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9994&quot; title=&quot;sanity-scrub test_5: test failed to respond and timed out&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9994&quot;&gt;&lt;strike&gt;LU-9994&lt;/strike&gt;&lt;/a&gt; obdclass: fix llog_cat_id2handle() error handling&lt;br/&gt;
3dcb7d0 &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10132&quot; title=&quot;IO execvp errors 2.10 client/EE3.1.1 server&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10132&quot;&gt;&lt;strike&gt;LU-10132&lt;/strike&gt;&lt;/a&gt; llite: handle xattr cache refill race&lt;br/&gt;
ec6bdd5 &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9951&quot; title=&quot;check whether  posix_acl_update_mode exists&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9951&quot;&gt;&lt;strike&gt;LU-9951&lt;/strike&gt;&lt;/a&gt; lustre_compat: add wrapper function for posix_acl_update_mode&lt;br/&gt;
</environment>
        <key id="49108">LU-10198</key>
            <summary>GPF llog_osd_declare_write_rec+0xb6/0x3d0 </summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="tappro">Mikhail Pershin</assignee>
                                    <reporter username="aboyko">Alexander Boyko</reporter>
                        <labels>
                            <label>llnl</label>
                    </labels>
                <created>Fri, 3 Nov 2017 13:54:01 +0000</created>
                <updated>Mon, 9 Mar 2020 20:07:39 +0000</updated>
                            <resolved>Sat, 8 Feb 2020 04:13:22 +0000</resolved>
                                                    <fixVersion>Lustre 2.14.0</fixVersion>
                    <fixVersion>Lustre 2.12.5</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="212749" author="aboyko" created="Fri, 3 Nov 2017 13:59:03 +0000"  >&lt;p&gt;Oops, I missed the project. Is it possible to move this to LU?&lt;/p&gt;</comment>
                            <comment id="216271" author="tappro" created="Thu, 14 Dec 2017 09:52:37 +0000"  >&lt;p&gt;It looks like the object in lgh_obj was freed by another thread while it was being used by the current thread. This can be the result of a llog_cat_id2handle() call: it may take an already existing llog_handle, but the lgh_obj reference is not taken in that case, so a concurrent llog_close() might drop it to zero and cause the free. I am not 100% sure that this is exactly what happened there, but I&apos;d look in that direction first. As a quick solution we can add lu_object_get() to llog_handle_get() and lu_object_put() to llog_handle_put(). Could you try to reproduce this with such changes?&lt;/p&gt;</comment>
                            <comment id="262162" author="gerrit" created="Wed, 29 Jan 2020 22:06:35 +0000"  >&lt;p&gt;Mike Pershin (mpershin@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/37367&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37367&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10198&quot; title=&quot;GPF llog_osd_declare_write_rec+0xb6/0x3d0 &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10198&quot;&gt;&lt;del&gt;LU-10198&lt;/del&gt;&lt;/a&gt; llog: keep llog handle alive until last reference&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 467db9d4f3dd6b3036826033e8dbe222815b9463&lt;/p&gt;</comment>
                            <comment id="262882" author="gerrit" created="Sat, 8 Feb 2020 03:59:48 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/37367/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37367/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10198&quot; title=&quot;GPF llog_osd_declare_write_rec+0xb6/0x3d0 &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10198&quot;&gt;&lt;del&gt;LU-10198&lt;/del&gt;&lt;/a&gt; llog: keep llog handle alive until last reference&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: d6bd5e9cc49b3bb9901ada503107e8b0eca44f7e&lt;/p&gt;</comment>
                            <comment id="262913" author="pjones" created="Sat, 8 Feb 2020 04:13:22 +0000"  >&lt;p&gt;Landed for 2.14&lt;/p&gt;</comment>
                            <comment id="263010" author="gerrit" created="Mon, 10 Feb 2020 15:18:42 +0000"  >&lt;p&gt;Minh Diep (mdiep@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/37514&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37514&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10198&quot; title=&quot;GPF llog_osd_declare_write_rec+0xb6/0x3d0 &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10198&quot;&gt;&lt;del&gt;LU-10198&lt;/del&gt;&lt;/a&gt; llog: keep llog handle alive until last reference&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 163744fa5dd801941de6c3ca5a65b8231c82dd09&lt;/p&gt;</comment>
                            <comment id="263983" author="gerrit" created="Tue, 25 Feb 2020 06:16:03 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/37514/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37514/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10198&quot; title=&quot;GPF llog_osd_declare_write_rec+0xb6/0x3d0 &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10198&quot;&gt;&lt;del&gt;LU-10198&lt;/del&gt;&lt;/a&gt; llog: keep llog handle alive until last reference&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 4e3d745f82d0acf583975f7fbfcd3ce8841e9b9c&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                                        </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="57472">LU-13018</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzn4f:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>