<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:35:45 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-10511] Stack overflow (?) on ost osd ldiskfs write path?</title>
                <link>https://jira.whamcloud.com/browse/LU-10511</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;From time to time I am getting crashes like this:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[48156.988750] Lustre: lustre-OST0001: Imperative Recovery not enabled, recovery window 60-180
[48163.913945] Lustre: lustre-OST0000: Connection restored to 192.168.10.219@tcp (at 0@lo)
[48163.949542] BUG: sleeping function called from invalid context at /home/green/git/lustre-release/ldiskfs/ext4_jbd2.c:259
[48163.951038] in_atomic(): 1, irqs_disabled(): 0, pid: 4792, name: ll_ost00_002
[48163.951463] Lustre: Mounted lustre-client
[48163.953482] INFO: lockdep is turned off.
[48163.954365] CPU: 1 PID: 4792 Comm: ll_ost00_002 Tainted: G        W  OE  ------------   3.10.0-debug #1
[48163.956101] Hardware name: Bochs Bochs, BIOS Bochs 01/01/2011
[48163.957005]  ffff88004b92e6c0 000000000f8a8783 ffff880019e6f840 ffffffff816fd400
[48163.958581]  ffff880019e6f858 ffffffff810b0109 ffff88002f521f88 ffff880019e6f8b8
[48163.960111]  ffffffffa0a63308 ffff88002f521f88 0000000000000002 000000000f8a8783
[48163.961584] Call Trace:
[48163.962274]  [&amp;lt;ffffffff816fd400&amp;gt;] dump_stack+0x19/0x1b
[48163.963004]  [&amp;lt;ffffffff810b0109&amp;gt;] __might_sleep+0xe9/0x110
[48163.963787]  [&amp;lt;ffffffffa0a63308&amp;gt;] __ldiskfs_handle_dirty_metadata+0x38/0x230 [ldiskfs]
[48163.965210]  [&amp;lt;ffffffff810a4055&amp;gt;] ? wake_up_bit+0x25/0x30
[48163.965968]  [&amp;lt;ffffffffa0a77bb2&amp;gt;] ldiskfs_getblk+0x142/0x210 [ldiskfs]
[48163.966850]  [&amp;lt;ffffffffa0a77ca7&amp;gt;] ldiskfs_bread+0x27/0xe0 [ldiskfs]
[48163.967650]  [&amp;lt;ffffffffa0b14531&amp;gt;] osd_ldiskfs_write_record+0x181/0x3d0 [osd_ldiskfs]
[48163.968765]  [&amp;lt;ffffffff810e3244&amp;gt;] ? lockdep_init_map+0xc4/0x600
[48163.969398]  [&amp;lt;ffffffffa0b148c0&amp;gt;] osd_write+0x140/0x5b0 [osd_ldiskfs]
[48163.970006]  [&amp;lt;ffffffffa03bfd09&amp;gt;] dt_record_write+0x39/0x120 [obdclass]
[48163.970690]  [&amp;lt;ffffffffa063fb37&amp;gt;] tgt_client_data_write.isra.18+0x167/0x180 [ptlrpc]
[48163.971859]  [&amp;lt;ffffffffa06431d3&amp;gt;] tgt_client_data_update+0x393/0x5d0 [ptlrpc]
[48163.972595]  [&amp;lt;ffffffffa064382b&amp;gt;] tgt_client_new+0x41b/0x610 [ptlrpc]
[48163.973432]  [&amp;lt;ffffffffa0db6ff3&amp;gt;] ofd_obd_connect+0x3a3/0x4c0 [ofd]
[48163.974487]  [&amp;lt;ffffffffa05ad028&amp;gt;] target_handle_connect+0x1118/0x29e0 [ptlrpc]
[48163.976234]  [&amp;lt;ffffffffa065275a&amp;gt;] tgt_request_handle+0x40a/0x13e0 [ptlrpc]
[48163.977196]  [&amp;lt;ffffffffa05f7c21&amp;gt;] ptlrpc_server_handle_request+0x261/0xaf0 [ptlrpc]
[48163.978766]  [&amp;lt;ffffffffa05fb9d8&amp;gt;] ptlrpc_main+0xa58/0x1df0 [ptlrpc]
[48163.979522]  [&amp;lt;ffffffff81706487&amp;gt;] ? _raw_spin_unlock_irq+0x27/0x50
[48163.980246]  [&amp;lt;ffffffffa05faf80&amp;gt;] ? ptlrpc_register_service+0xeb0/0xeb0 [ptlrpc]
[48163.981587]  [&amp;lt;ffffffff810a2eda&amp;gt;] kthread+0xea/0xf0
[48163.982154]  [&amp;lt;ffffffff810a2df0&amp;gt;] ? kthread_create_on_node+0x140/0x140
[48163.983448]  [&amp;lt;ffffffff8170fbd8&amp;gt;] ret_from_fork+0x58/0x90
[48163.984044]  [&amp;lt;ffffffff810a2df0&amp;gt;] ? kthread_create_on_node+0x140/0x140
[48163.984926] LNetError: 4792:0:(lib-lnet.h:479:lnet_msg_alloc()) ASSERTION( !(((current_thread_info()-&amp;gt;preempt_count) &amp;amp; ((((1UL &amp;lt;&amp;lt; (10))-1) &amp;lt;&amp;lt; ((0 + 8) + 8)) | (((1UL &amp;lt;&amp;lt; (8))-1) &amp;lt;&amp;lt; (0 + 8)) | (((1UL &amp;lt;&amp;lt; (1))-1) &amp;lt;&amp;lt; (((0 + 8) + 8) + 10))))) || (((sizeof(*msg))) &amp;lt;= (2 &amp;lt;&amp;lt; 12) &amp;amp;&amp;amp; (((((( gfp_t)0x10u) | (( gfp_t)0x40u)))) &amp;amp; ((( gfp_t)0x20u)))) != 0 ) failed:
[48163.988383] LNetError: 4792:0:(lib-lnet.h:479:lnet_msg_alloc()) LBUG
[48163.989081] Kernel panic - not syncing: LBUG in interrupt.

[48163.990700] CPU: 1 PID: 4792 Comm: ll_ost00_002 Tainted: G        W  OE  ------------   3.10.0-debug #1
[48163.992415] Hardware name: Bochs Bochs, BIOS Bochs 01/01/2011
[48163.993321]  ffffffffa01d81fe 000000000f8a8783 ffff880019e6f9f8 ffffffff816fd400
[48163.995039]  ffff880019e6fa78 ffffffff816f8c74 0000000000000008 ffff880019e6fa88
[48163.996763]  ffff880019e6fa28 000000000f8a8783 0000000000000010 0000000000000001
[48163.998433] Call Trace:
[48163.999220]  [&amp;lt;ffffffff816fd400&amp;gt;] dump_stack+0x19/0x1b
[48164.000084]  [&amp;lt;ffffffff816f8c74&amp;gt;] panic+0xd8/0x1e7
[48164.000910]  [&amp;lt;ffffffffa01b8882&amp;gt;] lbug_with_loc+0x72/0xb0 [libcfs]
[48164.001591]  [&amp;lt;ffffffffa030408c&amp;gt;] LNetPut+0x6bc/0x7a0 [lnet]
[48164.002227]  [&amp;lt;ffffffffa05e32c6&amp;gt;] ptl_send_buf+0x146/0x530 [ptlrpc]
[48164.002921]  [&amp;lt;ffffffffa0606a37&amp;gt;] ? at_measured+0x1c7/0x380 [ptlrpc]
[48164.003661]  [&amp;lt;ffffffffa05e6711&amp;gt;] ptlrpc_send_reply+0x2c1/0x890 [ptlrpc]
[48164.004379]  [&amp;lt;ffffffffa05a60b1&amp;gt;] target_send_reply_msg+0x91/0x180 [ptlrpc]
[48164.005048]  [&amp;lt;ffffffffa05b0736&amp;gt;] target_send_reply+0x326/0x750 [ptlrpc]
[48164.005788]  [&amp;lt;ffffffffa05ed597&amp;gt;] ? lustre_msg_set_last_committed+0x27/0xa0 [ptlrpc]
[48164.007091]  [&amp;lt;ffffffffa06528e7&amp;gt;] tgt_request_handle+0x597/0x13e0 [ptlrpc]
[48164.007971]  [&amp;lt;ffffffffa05f7c21&amp;gt;] ptlrpc_server_handle_request+0x261/0xaf0 [ptlrpc]
[48164.009154]  [&amp;lt;ffffffffa05fb9d8&amp;gt;] ptlrpc_main+0xa58/0x1df0 [ptlrpc]
[48164.009735]  [&amp;lt;ffffffff81706487&amp;gt;] ? _raw_spin_unlock_irq+0x27/0x50
[48164.010363]  [&amp;lt;ffffffffa05faf80&amp;gt;] ? ptlrpc_register_service+0xeb0/0xeb0 [ptlrpc]
[48164.011738]  [&amp;lt;ffffffff810a2eda&amp;gt;] kthread+0xea/0xf0
[48164.012328]  [&amp;lt;ffffffff810a2df0&amp;gt;] ? kthread_create_on_node+0x140/0x140
[48164.013853]  [&amp;lt;ffffffff8170fbd8&amp;gt;] ret_from_fork+0x58/0x90
[48164.014732]  [&amp;lt;ffffffff810a2df0&amp;gt;] ? kthread_create_on_node+0x140/0x140
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I think this is a sign of a stack overflow sometime earlier that ruined our task's kernel data, making it think all sorts of incorrect things, like that we are in irq/atomic context and whatnot.&lt;/p&gt;</description>
                <environment></environment>
        <key id="50224">LU-10511</key>
            <summary>Stack overflow (?) on ost osd ldiskfs write path?</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="green">Oleg Drokin</reporter>
                        <labels>
                    </labels>
                <created>Sun, 14 Jan 2018 21:04:34 +0000</created>
                <updated>Sun, 14 Jan 2018 21:04:34 +0000</updated>
                                                                                <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzr47:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>