<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:22:25 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-15920] Interop parallel-scale-nfsv4: BUG: unable to handle kernel NULL pointer dereference at 0000000000000000</title>
                <link>https://jira.whamcloud.com/browse/LU-15920</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for sarah &amp;lt;sarah@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/d5c9683a-6143-4ddc-8225-daa1bb8cb3fe&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/d5c9683a-6143-4ddc-8225-daa1bb8cb3fe&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Before parallel-scale-nfsv4 ran, all test nodes crashed as follows:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[27499.656301] SysRq : Trigger a crash
[27499.657194] BUG: unable to handle kernel NULL pointer dereference at           (null)
[27499.658657] IP: [&amp;lt;ffffffff86a75596&amp;gt;] sysrq_handle_crash+0x16/0x20
[27499.660775] Oops: 0002 [#1] SMP 
[27499.677098] CPU: 1 PID: 7956 Comm: bash Kdump: loaded Tainted: G           OE  ------------   3.10.0-1160.49.1.el7.x86_64 #1
[27499.678989] Hardware name: Red Hat KVM, BIOS 0.5.1 01/01/2011
[27499.681238] RIP: 0010:[&amp;lt;ffffffff86a75596&amp;gt;]  [&amp;lt;ffffffff86a75596&amp;gt;] sysrq_handle_crash+0x16/0x20
[27499.693443] Call Trace:
[27499.693909]  [&amp;lt;ffffffff86a75dbd&amp;gt;] __handle_sysrq+0x10d/0x170
[27499.694905]  [&amp;lt;ffffffff86a76228&amp;gt;] write_sysrq_trigger+0x28/0x40
[27499.695966]  [&amp;lt;ffffffff868c76f0&amp;gt;] proc_reg_write+0x40/0x80
[27499.696947]  [&amp;lt;ffffffff8684e590&amp;gt;] vfs_write+0xc0/0x1f0
[27499.699015]  [&amp;lt;ffffffff8684f36f&amp;gt;] SyS_write+0x7f/0xf0
[27499.701145]  [&amp;lt;ffffffff86d95f92&amp;gt;] system_call_fastpath+0x25/0x2a
[    0.000000] Initializing cgroup subsys cpuset
[    0.000000] Initializing cgroup subsys cpu
[    0.000000] Initializing cgroup subsys cpuacct
[    0.000000] Linux version 3.10.0-1160.49.1.el7.x86_64 (mockbuild@kbuilder.bsys.centos.org) (gcc version 4.8.5 20150623 (Red Hat 4.8.5-44) (GCC) ) #1 SMP Tue Nov 30 15:51:32 UTC 2021
[    0.000000] Command line: BOOT_IMAGE=/boot/vmlinuz-3.10.0-1160.49.1.el7.x86_64 ro console=ttyS0,115200 console=tty0 console=ttyS0,115200 net.ifnames=0 LANG=en_US.UTF-8 slab_nomerge slub_nomerge irqpoll nr_cpus=1 reset_devices cgroup_disable=memory mce=off numa=off udev.children-max=2 panic=10 acpi_no_memhotplug transparent_hugepage=never nokaslr novmcoredd hest_disable disable_cpu_apicid=0 elfcorehdr=867700K
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="70663">LU-15920</key>
            <summary>Interop parallel-scale-nfsv4: BUG: unable to handle kernel NULL pointer dereference at 0000000000000000</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Tue, 7 Jun 2022 19:04:13 +0000</created>
                <updated>Wed, 5 Apr 2023 17:46:43 +0000</updated>
                                            <version>Lustre 2.12.9</version>
                    <version>Lustre 2.15.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="336973" author="adilger" created="Tue, 7 Jun 2022 20:46:10 +0000"  >&lt;blockquote&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[27499.656301] SysRq : Trigger a crash
[27499.657194] BUG: unable to handle kernel NULL pointer dereference at           (null)
[27499.658657] IP: [&amp;lt;ffffffff86a75596&amp;gt;] sysrq_handle_crash+0x16/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;&lt;/blockquote&gt;
&lt;p&gt;This looks like &quot;&lt;tt&gt;sysrq-c&lt;/tt&gt;&quot; or &quot;&lt;tt&gt;echo c &amp;gt; /proc/sysrq-trigger&lt;/tt&gt;&quot; was run on the nodes.  I would suspect that autotest/ljb was doing this, maybe because of a problem in a previous test session, or similar?&lt;/p&gt;</comment>
                            <comment id="337739" author="sarah" created="Tue, 14 Jun 2022 17:03:00 +0000"  >&lt;p&gt;A similar error happened in 2.12.9 testing with an Ubuntu client, in conf-sanity test_83&lt;br/&gt;
&lt;a href=&quot;https://testing.whamcloud.com/test_sets/504767ec-1f5b-46c8-a1fa-2f39e5aad0d4&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/504767ec-1f5b-46c8-a1fa-2f39e5aad0d4&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;MDS console shows&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[25136.581679]           pickup  4951   7538652.811805        20   120         0.000000         9.608621         0.000000 0 /
[25136.583882]             bash  4998   7538802.056886        27   120         0.000000        10.687356         0.000000 0 /
[25136.586090] R           bash  5031   7539058.583248         2   120         0.000000       239.691301         0.000000 0 /
[25136.588298] 
[25138.305731] SysRq : Trigger a crash
[25138.306658] BUG: unable to handle kernel NULL pointer dereference at           (null)
[25138.308193] IP: [&amp;lt;ffffffff91075746&amp;gt;] sysrq_handle_crash+0x16/0x20
[25138.309346] PGD 80000000b9ef1067 PUD bb79d067 PMD 0 
[25138.310370] Oops: 0002 [#1] SMP 
[25138.311052] Modules linked in: dm_flakey osp(OE) mdd(OE) lod(OE) mdt(OE) lfsck(OE) mgs(OE) mgc(OE) osd_ldiskfs(OE) lquota(OE) fid(OE) fld(OE) ksocklnd(OE) ptlrpc(OE) obdclass(OE) lnet(OE) ldiskfs(OE) libcfs(OE) loop rpcsec_gss_krb5 auth_rpcgss nfsv4 dns_resolver nfs lockd grace fscache rpcrdma ib_isert iscsi_target_mod ib_iser libiscsi scsi_transport_iscsi ib_srpt target_core_mod crc_t10dif crct10dif_generic ib_srp scsi_transport_srp scsi_tgt ib_ipoib rdma_ucm ib_uverbs ib_umad rdma_cm ib_cm iw_cm ib_core sunrpc dm_mod iosf_mbi crc32_pclmul ghash_clmulni_intel ppdev aesni_intel lrw gf128mul glue_helper pcspkr ablk_helper cryptd joydev virtio_balloon i2c_piix4 parport_pc parport ip_tables ext4 mbcache jbd2 ata_generic pata_acpi ata_piix virtio_net net_failover virtio_blk failover crct10dif_pclmul crct10dif_common crc32c_intel libata serio_raw virtio_pci virtio_ring virtio floppy [last unloaded: dm_flakey]
[25138.328431] CPU: 0 PID: 5080 Comm: bash Kdump: loaded Tainted: G           OE  ------------   3.10.0-1160.49.1.el7_lustre.x86_64 #1
[25138.330535] Hardware name: Red Hat KVM, BIOS 0.5.1 01/01/2011
[25138.331592] task: ffff9966d2eea100 ti: ffff9966bda8c000 task.ti: ffff9966bda8c000
[25138.332945] RIP: 0010:[&amp;lt;ffffffff91075746&amp;gt;]  [&amp;lt;ffffffff91075746&amp;gt;] sysrq_handle_crash+0x16/0x20
[25138.334517] RSP: 0018:ffff9966bda8fe58  EFLAGS: 00010246
[25138.335489] RAX: ffffffff91075730 RBX: ffffffff918e74a0 RCX: 0000000000000000
[25138.336770] RDX: 0000000000000000 RSI: ffff9966ffc138d8 RDI: 0000000000000063
[25138.338069] RBP: ffff9966bda8fe58 R08: ffffffff91c0387c R09: ffff9966c7d60f00
[25138.339372] R10: 000000000000467c R11: 000000000000467b R12: 0000000000000063
[25138.340657] R13: 0000000000000000 R14: 0000000000000008 R15: 0000000000000000
[25138.341946] FS:  00007fb90a545740(0000) GS:ffff9966ffc00000(0000) knlGS:0000000000000000
[25138.343407] CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[25138.344455] CR2: 0000000000000000 CR3: 000000009a4a0000 CR4: 00000000000606f0
[25138.345742] Call Trace:
[25138.346217]  [&amp;lt;ffffffff91075f6d&amp;gt;] __handle_sysrq+0x10d/0x170
[25138.347246]  [&amp;lt;ffffffff910763d8&amp;gt;] write_sysrq_trigger+0x28/0x40
[25138.348324]  [&amp;lt;ffffffff90ec78a0&amp;gt;] proc_reg_write+0x40/0x80
[25138.349325]  [&amp;lt;ffffffff90e4e590&amp;gt;] vfs_write+0xc0/0x1f0
[25138.350267]  [&amp;lt;ffffffff91395ed5&amp;gt;] ? system_call_after_swapgs+0xa2/0x13a
[25138.351462]  [&amp;lt;ffffffff90e4f36f&amp;gt;] SyS_write+0x7f/0xf0
[25138.352385]  [&amp;lt;ffffffff91395ed5&amp;gt;] ? system_call_after_swapgs+0xa2/0x13a
[25138.353598]  [&amp;lt;ffffffff91395f92&amp;gt;] system_call_fastpath+0x25/0x2a
[25138.354682]  [&amp;lt;ffffffff91395ed5&amp;gt;] ? system_call_after_swapgs+0xa2/0x13a
[25138.355869] Code: eb 9b 45 01 f4 45 39 65 34 75 e5 4c 89 ef e8 e2 f7 ff ff eb db 66 66 66 66 90 55 48 89 e5 c7 05 91 27 7d 00 01 00 00 00 0f ae f8 &amp;lt;c6&amp;gt; 04 25 00 00 00 00 01 5d c3 66 66 66 66 90 55 31 c0 c7 05 0e 
[25138.361612] RIP  [&amp;lt;ffffffff91075746&amp;gt;] sysrq_handle_crash+0x16/0x20
[25138.362768]  RSP &amp;lt;ffff9966bda8fe58&amp;gt;
[25138.363421] CR2: 0000000000000000
[    0.000000] Initializing cgroup subsys cpuset
[    0.000000] Initializing cgroup subsys cpu
[    0.000000] Initializing cgroup subsys cpuacct
[    0.000000] Linux version 3.10.0-1160.49.1.el7_lustre.x86_64 (jenkins@onyx-203-el7-x8664-1.onyx.whamcloud.com) (gcc version 4.8.5 20150623 (Red Hat 4.8.5-39) (GCC) ) #1 SMP Thu Jun 2 13:15:53 UTC 2022
[    0.000000] Command line: BOOT_IMAGE=/boot/vmlinuz-3.10.0-1160.49.1.el7_lustre.x86_64 ro console=ttyS0,115200 console=tty0 console=ttyS0,115200 net.ifnames=0 LANG=en_US.UTF-8 slab_nomerge slub_nomerge irqpoll nr_cpus=1 reset_devices cgroup_disable=memory mce=off numa=off udev.children-max=2 panic=10 acpi_no_memhotplug transparent_hugepage=never nokaslr novmcoredd hest_disable disable_cpu_apicid=0 elfcorehdr=867700K
[    0.000000] e820: BIOS-provided physical RAM map:
[    0.000000] BIOS-e820: [mem 0x0000000000000000-0x0000000000000fff] reserved
[    0.000000] BIOS-e820: [mem 0x0000000000001000-0x000000000009f7ff] usable
[    0.000000] BIOS-e820: [mem 0x000000000009f800-0x000000000009ffff] reserved
[    0.000000] BIOS-e820: [mem 0x00000000000f0000-0x00000000000fffff] reserved
[    0.000000] BIOS-e820: [mem 0x0000000021000000-0x0000000034f5cfff] usable
[    0.000000] BIOS-e820: [mem 0x0000000034fff800-0x0000000034ffffff] usable
[    0.000000] BIOS-e820: [mem 0x00000000bfffa000-0x00000000bfffffff] reserved
[    0.000000] BIOS-e820: [mem 0x00000000feffc000-0x00000000feffffff] reserved
[    0.000000] BIOS-e820: [mem 0x00000000fffc0000-0x00000000ffffffff] reserved
[    0.000000] NX (Execute Disable) protection: active
[    0.000000] SMBIOS 2.4 present.
[    0.000000] DMI: Red Hat KVM, BIOS 0.5.1 01/01/2011
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="337780" author="adilger" created="Wed, 15 Jun 2022 00:25:57 +0000"  >&lt;blockquote&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[25138.305731] SysRq : Trigger a crash
[25138.306658] BUG: unable to handle kernel NULL pointer dereference at           (null)
[25138.308193] IP: [&amp;lt;ffffffff91075746&amp;gt;] sysrq_handle_crash+0x16/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;&lt;/blockquote&gt;
&lt;p&gt;This is again not so much a &quot;bug&quot; but rather something (user or test script) that is triggering a crash with &quot;&lt;tt&gt;echo c &amp;gt; /proc/sysrq-trigger&lt;/tt&gt;&quot;.  That might be autotest timing out the test and trying to reboot the node, or the test script doing &apos;hard&apos; failover, I&apos;m not sure.  It is likely to be something in the autotest area, so I&apos;ve added Charlie and Lee to the CC list.&lt;/p&gt;</comment>
                            <comment id="337877" author="colmstea" created="Wed, 15 Jun 2022 20:06:12 +0000"  >&lt;p&gt;Since &lt;a href=&quot;https://jira.whamcloud.com/browse/ATM-2248&quot; class=&quot;external-link&quot; rel=&quot;nofollow&quot;&gt;https://jira.whamcloud.com/browse/ATM-2248&lt;/a&gt; was deployed, AT forces crash dumps on all nodes in the cluster upon a timeout.&lt;/p&gt;

&lt;p&gt;In the session referenced in the description, parallel-scale-nfsv4 actually started but timed out in the suite&apos;s startup phase. AFAIK, each suite goes through this startup phase but it is not recorded in auster&apos;s results.yml file which can make situations like this confusing. There is also a suite cleanup phase which is also not recorded.&lt;/p&gt;

&lt;p&gt;autotest_execution.log -&#160;&lt;a href=&quot;https://testing.whamcloud.com/test_logs/8ae1cf61-4779-449e-8431-e63e8620123e/show_text&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_logs/8ae1cf61-4779-449e-8431-e63e8620123e/show_text&lt;/a&gt;&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;2022-06-01T14:09:16 Suite parallel-scale-nfsv4 started
2022-06-01T14:10:15 Test running for 397 minutes
2022-06-01T14:11:15 Test running for 398 minutes
2022-06-01T14:12:15 Test running for 399 minutes
...
2022-06-01T15:06:15 Test running for 453 minutes
2022-06-01T15:07:15 Test running for 454 minutes
2022-06-01T15:08:15 Test running for 455 minutes
2022-06-01T15:09:10 Timing session out! Timeout has been exceeded but the test framework is still running
2022-06-01T15:09:10 Killing test framework...
2022-06-01T15:09:10 Test framework killed
2022-06-01T15:09:10 Suite parallel-scale-nfsv4 timed out, collecting logs...
2022-06-01T15:09:10 capturing timeout logs from trevis-42vm1
2022-06-01T15:09:15 Test running for 456 minutes
2022-06-01T15:09:15 capturing timeout logs from trevis-42vm2
2022-06-01T15:09:19 capturing timeout logs from trevis-42vm3
2022-06-01T15:09:26 capturing timeout logs from trevis-42vm4
2022-06-01T15:09:31 Forcing crash dumps on all nodes...
2022-06-01T15:09:31 trevis-42vm1 - Forcing crash dump...
2022-06-01T15:09:31 trevis-42vm2 - Forcing crash dump...
2022-06-01T15:09:31 trevis-42vm3 - Forcing crash dump...
2022-06-01T15:09:31 trevis-42vm4 - Forcing crash dump...
2022-06-01T15:10:15 Test running for 457 minutes
2022-06-01T15:10:15 Forcing crash dumps complete
2022-06-01T15:10:15 Collecting crash files...&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;&#160;&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="70773">LU-15950</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i02rmf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>