<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:14:37 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1216] LBUG: ASSERTION(lli-&gt;lli_sai == NULL) failed using robinhood tool</title>
                <link>https://jira.whamcloud.com/browse/LU-1216</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;We&apos;re running a backup application, robinhood, which reads changes from the Lustre changelog and then performs copies from Lustre to another backend. We&apos;re frequently hitting the same crash on the client node that performs all these actions.&lt;/p&gt;

&lt;p&gt;Before the crash I can see some llog threads blocked for more than 120 seconds (see dmesg attached). Then I get some errors reading the directory being accessed and finally the LBUG is raised.&lt;/p&gt;

&lt;p&gt;See the attached file for the complete dmesg:&lt;/p&gt;

&lt;p&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104c67d&amp;gt;&amp;#93;&lt;/span&gt; ? wake_up_new_task+0xed/0x150&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81066790&amp;gt;&amp;#93;&lt;/span&gt; ? process_timeout+0x0/0x10&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8147cb05&amp;gt;&amp;#93;&lt;/span&gt; schedule_timeout+0x205/0x2d0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05fcd10&amp;gt;&amp;#93;&lt;/span&gt; ? llog_process_thread+0x0/0xe70 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81004142&amp;gt;&amp;#93;&lt;/span&gt; ? kernel_thread+0x82/0xe0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05fcd10&amp;gt;&amp;#93;&lt;/span&gt; ? llog_process_thread+0x0/0xe70 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8147c793&amp;gt;&amp;#93;&lt;/span&gt; wait_for_common+0x123/0x180&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104cf40&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x0/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0581cba&amp;gt;&amp;#93;&lt;/span&gt; ? cfs_create_thread+0x7a/0xa0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05ffa90&amp;gt;&amp;#93;&lt;/span&gt; ? llog_cat_process_cb+0x0/0x400 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8147c8ad&amp;gt;&amp;#93;&lt;/span&gt; wait_for_completion+0x1d/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05fbb33&amp;gt;&amp;#93;&lt;/span&gt; llog_process_flags+0xf3/0x660 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0751587&amp;gt;&amp;#93;&lt;/span&gt; ? llog_client_read_header+0x187/0x640 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05feef8&amp;gt;&amp;#93;&lt;/span&gt; llog_cat_process_flags+0x188/0x2d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05fdfef&amp;gt;&amp;#93;&lt;/span&gt; ? llog_init_handle+0x17f/0xa70 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0890240&amp;gt;&amp;#93;&lt;/span&gt; ? changelog_show_cb+0x0/0x310 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08993f0&amp;gt;&amp;#93;&lt;/span&gt; ? mdc_changelog_send_thread+0x0/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08998bb&amp;gt;&amp;#93;&lt;/span&gt; mdc_changelog_send_thread+0x4cb/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810017bc&amp;gt;&amp;#93;&lt;/span&gt; ? __switch_to+0x1ac/0x320&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08993f0&amp;gt;&amp;#93;&lt;/span&gt; ? mdc_changelog_send_thread+0x0/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810041aa&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08993f0&amp;gt;&amp;#93;&lt;/span&gt; ? mdc_changelog_send_thread+0x0/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08993f0&amp;gt;&amp;#93;&lt;/span&gt; ? mdc_changelog_send_thread+0x0/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810041a0&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;br/&gt;
INFO: task mdc_clg_send_th:4499 blocked for more than 120 seconds.&lt;br/&gt;
&quot;echo 0 &amp;gt; /proc/sys/kernel/hung_task_timeout_secs&quot; disables this message.&lt;br/&gt;
mdc_clg_send_ D 0000000000000001     0  4499      2 0x00000080&lt;br/&gt;
 ffff8823b3e53c40 0000000000000046 ffff8823b3e53bd0 ffffffff8104c67d&lt;br/&gt;
 ffff8823b3e53c80 0000000000000282 ffff8823b3f7c900 0000000000000000&lt;br/&gt;
 ffff8823b3f7ccc8 ffff8823b3e53fd8 000000000000db00 ffff8823b3f7ccc8&lt;br/&gt;
Call Trace:&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104c67d&amp;gt;&amp;#93;&lt;/span&gt; ? wake_up_new_task+0xed/0x150&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81066790&amp;gt;&amp;#93;&lt;/span&gt; ? process_timeout+0x0/0x10&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8147cb05&amp;gt;&amp;#93;&lt;/span&gt; schedule_timeout+0x205/0x2d0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05fcd10&amp;gt;&amp;#93;&lt;/span&gt; ? llog_process_thread+0x0/0xe70 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81004142&amp;gt;&amp;#93;&lt;/span&gt; ? kernel_thread+0x82/0xe0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05fcd10&amp;gt;&amp;#93;&lt;/span&gt; ? llog_process_thread+0x0/0xe70 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8147c793&amp;gt;&amp;#93;&lt;/span&gt; wait_for_common+0x123/0x180&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104cf40&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x0/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0581cba&amp;gt;&amp;#93;&lt;/span&gt; ? cfs_create_thread+0x7a/0xa0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05ffa90&amp;gt;&amp;#93;&lt;/span&gt; ? llog_cat_process_cb+0x0/0x400 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8147c8ad&amp;gt;&amp;#93;&lt;/span&gt; wait_for_completion+0x1d/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05fbb33&amp;gt;&amp;#93;&lt;/span&gt; llog_process_flags+0xf3/0x660 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0751587&amp;gt;&amp;#93;&lt;/span&gt; ? llog_client_read_header+0x187/0x640 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05feef8&amp;gt;&amp;#93;&lt;/span&gt; llog_cat_process_flags+0x188/0x2d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05fdfef&amp;gt;&amp;#93;&lt;/span&gt; ? llog_init_handle+0x17f/0xa70 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0890240&amp;gt;&amp;#93;&lt;/span&gt; ? changelog_show_cb+0x0/0x310 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08993f0&amp;gt;&amp;#93;&lt;/span&gt; ? mdc_changelog_send_thread+0x0/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08998bb&amp;gt;&amp;#93;&lt;/span&gt; mdc_changelog_send_thread+0x4cb/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810017bc&amp;gt;&amp;#93;&lt;/span&gt; ? __switch_to+0x1ac/0x320&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08993f0&amp;gt;&amp;#93;&lt;/span&gt; ? mdc_changelog_send_thread+0x0/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810041aa&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08993f0&amp;gt;&amp;#93;&lt;/span&gt; ? mdc_changelog_send_thread+0x0/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08993f0&amp;gt;&amp;#93;&lt;/span&gt; ? mdc_changelog_send_thread+0x0/0xb90 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810041a0&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;br/&gt;
LustreError: 4491:0:(dir.c:478:ll_get_dir_page()) read cache page: &lt;span class=&quot;error&quot;&gt;&amp;#91;0x200000002:0x2:0x0&amp;#93;&lt;/span&gt; at 0: rc -1&lt;br/&gt;
LustreError: 4491:0:(statahead.c:1001:is_first_dirent()) error reading dir &lt;span class=&quot;error&quot;&gt;&amp;#91;0x200000002:0x2:0x0&amp;#93;&lt;/span&gt; at 0: &lt;span class=&quot;error&quot;&gt;&amp;#91;rc -1&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;parent 4491&amp;#93;&lt;/span&gt;&lt;br/&gt;
LustreError: 8003:0:(dir.c:439:ll_get_dir_page()) dir page locate: &lt;span class=&quot;error&quot;&gt;&amp;#91;0x200000002:0x2:0x0&amp;#93;&lt;/span&gt; at 0: rc -5&lt;br/&gt;
LustreError: 4485:0:(dir.c:439:ll_get_dir_page()) dir page locate: &lt;span class=&quot;error&quot;&gt;&amp;#91;0x200000002:0x2:0x0&amp;#93;&lt;/span&gt; at 0: rc -5&lt;br/&gt;
LustreError: 4485:0:(statahead.c:1001:is_first_dirent()) error reading dir &lt;span class=&quot;error&quot;&gt;&amp;#91;0x200000002:0x2:0x0&amp;#93;&lt;/span&gt; at 0: &lt;span class=&quot;error&quot;&gt;&amp;#91;rc -5&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;parent 4485&amp;#93;&lt;/span&gt;&lt;br/&gt;
LustreError: 4493:0:(dir.c:439:ll_get_dir_page()) dir page locate: &lt;span class=&quot;error&quot;&gt;&amp;#91;0x200000002:0x2:0x0&amp;#93;&lt;/span&gt; at 0: rc -5&lt;br/&gt;
LustreError: 4493:0:(dir.c:439:ll_get_dir_page()) Skipped 1 previous similar message&lt;br/&gt;
LustreError: 4493:0:(statahead.c:1001:is_first_dirent()) error reading dir &lt;span class=&quot;error&quot;&gt;&amp;#91;0x200000002:0x2:0x0&amp;#93;&lt;/span&gt; at 0: &lt;span class=&quot;error&quot;&gt;&amp;#91;rc -5&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;parent 4493&amp;#93;&lt;/span&gt;&lt;br/&gt;
LustreError: 4493:0:(dir.c:439:ll_get_dir_page()) dir page locate: &lt;span class=&quot;error&quot;&gt;&amp;#91;0x200000002:0x2:0x0&amp;#93;&lt;/span&gt; at 0: rc -5&lt;br/&gt;
LustreError: 4493:0:(dir.c:439:ll_get_dir_page()) Skipped 1 previous similar message&lt;br/&gt;
LustreError: 4493:0:(statahead.c:1001:is_first_dirent()) error reading dir &lt;span class=&quot;error&quot;&gt;&amp;#91;0x200000002:0x2:0x0&amp;#93;&lt;/span&gt; at 0: &lt;span class=&quot;error&quot;&gt;&amp;#91;rc -5&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;parent 0&amp;#93;&lt;/span&gt;&lt;br/&gt;
LustreError: 4483:0:(file.c:525:ll_file_open()) ASSERTION(lli-&amp;gt;lli_sai == NULL) failed&lt;br/&gt;
LustreError: 4483:0:(file.c:525:ll_file_open()) LBUG&lt;br/&gt;
Pid: 4483, comm: rbh-backup&lt;/p&gt;

&lt;p&gt;Call Trace:&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa057e855&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x55/0x80 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa057ee95&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x75/0xe0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa058ae46&amp;gt;&amp;#93;&lt;/span&gt; libcfs_assertion_failed+0x66/0x70 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa098398c&amp;gt;&amp;#93;&lt;/span&gt; ll_file_open+0xe0c/0xe60 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0990171&amp;gt;&amp;#93;&lt;/span&gt; ? ll_finish_md_op_data+0x2a1/0x4a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa09654f4&amp;gt;&amp;#93;&lt;/span&gt; ? ll_revalidate_it_finish+0x64/0x240 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa096a8e0&amp;gt;&amp;#93;&lt;/span&gt; ? ll_dir_open+0x0/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa096a917&amp;gt;&amp;#93;&lt;/span&gt; ll_dir_open+0x37/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115e5fa&amp;gt;&amp;#93;&lt;/span&gt; ? file_move+0x4a/0x70&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115a59a&amp;gt;&amp;#93;&lt;/span&gt; __dentry_open+0x10a/0x350&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115a979&amp;gt;&amp;#93;&lt;/span&gt; lookup_instantiate_filp+0x69/0x90&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0969701&amp;gt;&amp;#93;&lt;/span&gt; ll_revalidate_nd+0x331/0x400 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116b07a&amp;gt;&amp;#93;&lt;/span&gt; do_lookup+0x5a/0x220&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116b7a9&amp;gt;&amp;#93;&lt;/span&gt; __link_path_walk+0x569/0x820&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa096a8e0&amp;gt;&amp;#93;&lt;/span&gt; ? ll_dir_open+0x0/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa096a917&amp;gt;&amp;#93;&lt;/span&gt; ? ll_dir_open+0x37/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116c12a&amp;gt;&amp;#93;&lt;/span&gt; path_walk+0x6a/0xe0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116c2fb&amp;gt;&amp;#93;&lt;/span&gt; do_path_lookup+0x5b/0xa0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115e811&amp;gt;&amp;#93;&lt;/span&gt; ? get_empty_filp+0xa1/0x170&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116cf6b&amp;gt;&amp;#93;&lt;/span&gt; do_filp_open+0xfb/0xd30&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0985784&amp;gt;&amp;#93;&lt;/span&gt; ? ll_file_release+0x2e4/0x430 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8117bbb0&amp;gt;&amp;#93;&lt;/span&gt; ? mntput_no_expire+0x30/0x110&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81179ba2&amp;gt;&amp;#93;&lt;/span&gt; ? alloc_fd+0x92/0x160&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115a349&amp;gt;&amp;#93;&lt;/span&gt; do_sys_open+0x69/0x140&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810044f5&amp;gt;&amp;#93;&lt;/span&gt; ? math_state_restore+0x45/0x60&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115a460&amp;gt;&amp;#93;&lt;/span&gt; sys_open+0x20/0x30&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81003172&amp;gt;&amp;#93;&lt;/span&gt; system_call_fastpath+0x16/0x1b&lt;/p&gt;

&lt;p&gt;Kernel panic - not syncing: LBUG&lt;br/&gt;
Pid: 4483, comm: rbh-backup Tainted: G           ---------------- T 2.6.32-131.12.1.bl6.Bull.26.x86_64 #1&lt;br/&gt;
Call Trace:&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8147b742&amp;gt;&amp;#93;&lt;/span&gt; ? panic+0x78/0x143&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa057eeeb&amp;gt;&amp;#93;&lt;/span&gt; ? lbug_with_loc+0xcb/0xe0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa058ae46&amp;gt;&amp;#93;&lt;/span&gt; ? libcfs_assertion_failed+0x66/0x70 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa098398c&amp;gt;&amp;#93;&lt;/span&gt; ? ll_file_open+0xe0c/0xe60 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0990171&amp;gt;&amp;#93;&lt;/span&gt; ? ll_finish_md_op_data+0x2a1/0x4a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa09654f4&amp;gt;&amp;#93;&lt;/span&gt; ? ll_revalidate_it_finish+0x64/0x240 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa096a8e0&amp;gt;&amp;#93;&lt;/span&gt; ? ll_dir_open+0x0/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa096a917&amp;gt;&amp;#93;&lt;/span&gt; ? ll_dir_open+0x37/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115e5fa&amp;gt;&amp;#93;&lt;/span&gt; ? file_move+0x4a/0x70&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115a59a&amp;gt;&amp;#93;&lt;/span&gt; ? __dentry_open+0x10a/0x350&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115a979&amp;gt;&amp;#93;&lt;/span&gt; ? lookup_instantiate_filp+0x69/0x90&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0969701&amp;gt;&amp;#93;&lt;/span&gt; ? ll_revalidate_nd+0x331/0x400 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116b07a&amp;gt;&amp;#93;&lt;/span&gt; ? do_lookup+0x5a/0x220&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116b7a9&amp;gt;&amp;#93;&lt;/span&gt; ? __link_path_walk+0x569/0x820&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa096a8e0&amp;gt;&amp;#93;&lt;/span&gt; ? ll_dir_open+0x0/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa096a917&amp;gt;&amp;#93;&lt;/span&gt; ? ll_dir_open+0x37/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116c12a&amp;gt;&amp;#93;&lt;/span&gt; ? path_walk+0x6a/0xe0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116c2fb&amp;gt;&amp;#93;&lt;/span&gt; ? do_path_lookup+0x5b/0xa0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115e811&amp;gt;&amp;#93;&lt;/span&gt; ? get_empty_filp+0xa1/0x170&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116cf6b&amp;gt;&amp;#93;&lt;/span&gt; ? do_filp_open+0xfb/0xd30&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0985784&amp;gt;&amp;#93;&lt;/span&gt; ? ll_file_release+0x2e4/0x430 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8117bbb0&amp;gt;&amp;#93;&lt;/span&gt; ? mntput_no_expire+0x30/0x110&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81179ba2&amp;gt;&amp;#93;&lt;/span&gt; ? alloc_fd+0x92/0x160&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115a349&amp;gt;&amp;#93;&lt;/span&gt; ? do_sys_open+0x69/0x140&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810044f5&amp;gt;&amp;#93;&lt;/span&gt; ? math_state_restore+0x45/0x60&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8115a460&amp;gt;&amp;#93;&lt;/span&gt; ? sys_open+0x20/0x30&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81003172&amp;gt;&amp;#93;&lt;/span&gt; ? system_call_fastpath+0x16/0x1b&lt;/p&gt;


&lt;p&gt;Below is the associated backtrace (bt) for the rbh (robinhood running thread) process. The complete crash file can be provided if needed.&lt;/p&gt;

&lt;p&gt;crash&amp;gt; bt&lt;br/&gt;
PID: 4483   TASK: ffff8823b3f28a80  CPU: 1   COMMAND: &quot;rbh-backup&quot;&lt;br/&gt;
 #0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e977f0&amp;#93;&lt;/span&gt; machine_kexec at ffffffff81027a2b&lt;br/&gt;
 #1 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97850&amp;#93;&lt;/span&gt; crash_kexec at ffffffff810a3a52&lt;br/&gt;
 #2 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97920&amp;#93;&lt;/span&gt; panic at ffffffff8147b749&lt;br/&gt;
 #3 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e979a0&amp;#93;&lt;/span&gt; lbug_with_loc at ffffffffa057eeeb&lt;br/&gt;
 #4 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e979f0&amp;#93;&lt;/span&gt; libcfs_assertion_failed at ffffffffa058ae46&lt;br/&gt;
 #5 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97a40&amp;#93;&lt;/span&gt; ll_file_open at ffffffffa098398c&lt;br/&gt;
 #6 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97b50&amp;#93;&lt;/span&gt; ll_dir_open at ffffffffa096a917&lt;br/&gt;
 #7 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97ba0&amp;#93;&lt;/span&gt; __dentry_open at ffffffff8115a59a&lt;br/&gt;
 #8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97c00&amp;#93;&lt;/span&gt; lookup_instantiate_filp at ffffffff8115a979&lt;br/&gt;
 #9 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97c20&amp;#93;&lt;/span&gt; ll_revalidate_nd at ffffffffa0969701&lt;br/&gt;
#10 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97c80&amp;#93;&lt;/span&gt; do_lookup at ffffffff8116b07a&lt;br/&gt;
#11 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97ce0&amp;#93;&lt;/span&gt; __link_path_walk at ffffffff8116b7a9&lt;br/&gt;
#12 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97d60&amp;#93;&lt;/span&gt; path_walk at ffffffff8116c12a&lt;br/&gt;
#13 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97da0&amp;#93;&lt;/span&gt; do_path_lookup at ffffffff8116c2fb&lt;br/&gt;
#14 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97dd0&amp;#93;&lt;/span&gt; do_filp_open at ffffffff8116cf6b&lt;br/&gt;
#15 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97f20&amp;#93;&lt;/span&gt; do_sys_open at ffffffff8115a349&lt;br/&gt;
#16 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97f70&amp;#93;&lt;/span&gt; sys_open at ffffffff8115a460&lt;br/&gt;
#17 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8823b3e97f80&amp;#93;&lt;/span&gt; system_call_fastpath at ffffffff81003172&lt;br/&gt;
    RIP: 000000354a20ed4d  RSP: 00007fe88e2bf5e8  RFLAGS: 00010246&lt;br/&gt;
    RAX: 0000000000000002  RBX: ffffffff81003172  RCX: 0000000000000000&lt;br/&gt;
    RDX: 0000000000000000  RSI: 0000000000000000  RDI: 00007fe8880071f0&lt;br/&gt;
    RBP: 00007fe88e2c09c2   R8: 0000000000000000   R9: 0000000000000000&lt;br/&gt;
    R10: fffffffffffffff0  R11: 0000000000000293  R12: ffffffff8115a460&lt;br/&gt;
    R13: ffff8823b3e97f78  R14: 0000000000000003  R15: 00007fe88e2be5c0&lt;br/&gt;
    ORIG_RAX: 0000000000000002  CS: 0033  SS: 002b&lt;/p&gt;</description>
                <environment>Lustre-2.1.0 with 2.6.32-131.12.1 kernel </environment>
        <key id="13564">LU-1216</key>
            <summary>LBUG: ASSERTION(lli-&gt;lli_sai == NULL) failed using robinhood tool</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="2">Won&apos;t Fix</resolution>
                                        <assignee username="laisiyao">Lai Siyao</assignee>
                                    <reporter username="dmoreno">Diego Moreno</reporter>
                        <labels>
                    </labels>
                <created>Wed, 14 Mar 2012 06:12:04 +0000</created>
                <updated>Sun, 26 Aug 2012 10:35:20 +0000</updated>
                            <resolved>Thu, 29 Mar 2012 09:49:29 +0000</resolved>
                                                    <fixVersion>Lustre 2.1.3</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="31085" author="pjones" created="Wed, 14 Mar 2012 08:16:45 +0000"  >&lt;p&gt;Lai&lt;/p&gt;

&lt;p&gt;Could you look into this one please?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="31265" author="laisiyao" created="Thu, 15 Mar 2012 02:29:40 +0000"  >&lt;p&gt;The first ll_get_dir_page() failed with errno -1 (-EPERM); this looks to have been returned from the MDS. Could you check the MDS log?&lt;/p&gt;

&lt;p&gt;This assertion is caused by the statahead code, which is buggy in 2.1 and is fixed in 2.2. The patch is at &lt;a href=&quot;http://review.whamcloud.com/#change,1208&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,1208&lt;/a&gt;, but unfortunately it depends on some other changes, so it can&apos;t be backported to 2.1 directly. To work around this issue, you can disable statahead with `echo 0 &amp;gt; /proc/fs/lustre/llite/&amp;lt;client_device&amp;gt;/statahead_max` on the client, or else I can help backport the patch to 2.1, which may take a little time.&lt;/p&gt;</comment>
                            <comment id="32833" author="pjones" created="Thu, 29 Mar 2012 09:49:29 +0000"  >&lt;p&gt;Bull will work around this by disabling statahead until they upgrade to 2.2+.&lt;/p&gt;</comment>
                            <comment id="42564" author="bogl" created="Wed, 1 Aug 2012 16:41:10 +0000"  >&lt;p&gt;Putting in a fix to disable it by default.&lt;br/&gt;
This is just a temporary workaround until we have a proper fix.&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;http://review.whamcloud.com/#change,3512&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,3512&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzva0n:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>5157</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>