<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:22:36 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-2129] ASSERTION( last_rec-&gt;lrh_index == tail-&gt;lrt_index )</title>
                <link>https://jira.whamcloud.com/browse/LU-2129</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Lustre: DEBUG MARKER: ----&lt;del&gt;============= acceptance-small: parallel-scale ============&lt;/del&gt;---- Tue Oct 9 09:38:01 PDT 2012&lt;br/&gt;
Lustre: DEBUG MARKER: excepting tests: parallel_grouplock&lt;br/&gt;
Lustre: DEBUG MARKER: Using TIMEOUT=20&lt;br/&gt;
LustreError: 13309:0:(osd_io.c:1062:osd_ldiskfs_write_record()) sdd1: error reading offset 12288 (block 3): rc = -28&lt;br/&gt;
LustreError: 13309:0:(llog_osd.c:175:llog_osd_write_blob()) lustre-MDT0000-osd: error writing log buffer: rc = -28&lt;br/&gt;
LustreError: 13309:0:(mgs_llog.c:738:record_lcfg()) failed -28&lt;br/&gt;
LustreError: 13309:0:(mgs_llog.c:1074:mgs_write_log_direct_all()) MGS: writing log lustre-params: rc = -28&lt;br/&gt;
LustreError: 13309:0:(osd_io.c:1062:osd_ldiskfs_write_record()) sdd1: error reading offset 12288 (block 3): rc = -28&lt;br/&gt;
LustreError: 13309:0:(llog_osd.c:175:llog_osd_write_blob()) lustre-MDT0000-osd: error writing log buffer: rc = -28&lt;br/&gt;
LustreError: 13309:0:(mgs_llog.c:738:record_lcfg()) failed -28&lt;br/&gt;
LustreError: 13309:0:(mgs_llog.c:1074:mgs_write_log_direct_all()) MGS: writing log lustre-OST0000: rc = -28&lt;br/&gt;
LustreError: 13309:0:(mgs_llog.c:2956:mgs_write_log_param()) err -28 on param &apos;sys.jobid_var=procname_uid&apos;&lt;br/&gt;
LustreError: 13309:0:(mgs_handler.c:926:mgs_iocontrol()) MGS: setparam err: rc = -28&lt;br/&gt;
LustreError: 11580:0:(llog_osd.c:579:llog_osd_next_block()) ASSERTION( last_rec-&amp;gt;lrh_index == tail-&amp;gt;lrt_index ) failed: &lt;br/&gt;
LustreError: 11580:0:(llog_osd.c:579:llog_osd_next_block()) LBUG&lt;br/&gt;
Pid: 11580, comm: ll_mgs_0003&lt;/p&gt;

&lt;p&gt;Call Trace:&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0991905&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x55/0x80 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0991f17&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x47/0xb0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0cd6435&amp;gt;&amp;#93;&lt;/span&gt; llog_osd_next_block+0xa55/0xa60 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa151d436&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_pack_reply_flags+0xb6/0x210 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa153a80c&amp;gt;&amp;#93;&lt;/span&gt; llog_origin_handle_next_block+0x50c/0x780 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa1747f93&amp;gt;&amp;#93;&lt;/span&gt; mgs_handle+0xb13/0x11e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mgs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa09a2621&amp;gt;&amp;#93;&lt;/span&gt; ? libcfs_debug_msg+0x41/0x50 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152d8dc&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request+0x41c/0xe00 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e309&amp;gt;&amp;#93;&lt;/span&gt; ? __wake_up_common+0x59/0x90&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810533f3&amp;gt;&amp;#93;&lt;/span&gt; ? __wake_up+0x53/0x70&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152eecc&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_main+0xc0c/0x19f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152e2c0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x19f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c14a&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152e2c0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x19f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152e2c0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x19f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c140&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;/p&gt;

&lt;p&gt;Kernel panic - not syncing: LBUG&lt;br/&gt;
Pid: 11580, comm: ll_mgs_0003 Not tainted 2.6.32-279.5.1.el6_lustre.x86_64 #1&lt;br/&gt;
Call Trace:&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814fd58a&amp;gt;&amp;#93;&lt;/span&gt; ? panic+0xa0/0x168&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0991f6b&amp;gt;&amp;#93;&lt;/span&gt; ? lbug_with_loc+0x9b/0xb0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0cd6435&amp;gt;&amp;#93;&lt;/span&gt; ? llog_osd_next_block+0xa55/0xa60 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa151d436&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_pack_reply_flags+0xb6/0x210 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa153a80c&amp;gt;&amp;#93;&lt;/span&gt; ? llog_origin_handle_next_block+0x50c/0x780 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa1747f93&amp;gt;&amp;#93;&lt;/span&gt; ? mgs_handle+0xb13/0x11e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mgs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa09a2621&amp;gt;&amp;#93;&lt;/span&gt; ? libcfs_debug_msg+0x41/0x50 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152d8dc&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_server_handle_request+0x41c/0xe00 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e309&amp;gt;&amp;#93;&lt;/span&gt; ? __wake_up_common+0x59/0x90&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810533f3&amp;gt;&amp;#93;&lt;/span&gt; ? __wake_up+0x53/0x70&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152eecc&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0xc0c/0x19f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152e2c0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x19f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c14a&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0xa/0x20&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152e2c0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x19f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa152e2c0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x19f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c140&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;/p&gt;</description>
                <environment>&amp;nbsp;&lt;a href=&quot;https://build.whamcloud.com/job/lustre-master/951/&quot;&gt;https://build.whamcloud.com/job/lustre-master/951/&lt;/a&gt; &lt;br/&gt;
On opensfs with 1 mds, 4 oss, 24 clients</environment>
        <key id="16302">LU-2129</key>
            <summary>ASSERTION( last_rec-&gt;lrh_index == tail-&gt;lrt_index )</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="tappro">Mikhail Pershin</assignee>
                                    <reporter username="mdiep">Minh Diep</reporter>
                        <labels>
                            <label>NFBlocker</label>
                    </labels>
                <created>Tue, 9 Oct 2012 12:57:35 +0000</created>
                <updated>Tue, 20 Nov 2012 14:23:19 +0000</updated>
                            <resolved>Tue, 20 Nov 2012 14:23:19 +0000</resolved>
                                    <version>Lustre 2.4.0</version>
                                    <fixVersion>Lustre 2.4.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="46258" author="green" created="Tue, 9 Oct 2012 13:05:43 +0000"  >&lt;p&gt;This happens in my testing at random tests&lt;br/&gt;
last occurrence was this morning; a crashdump is available:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;[10933.785890] LustreError: 11126:0:(lmv_obd.c:1190:lmv_statfs()) can&apos;t stat MDS #0 (lustre-MDT0000-mdc-ffff880096259bf0), error -5
[10933.786846] LustreError: 11126:0:(llite_lib.c:1558:ll_statfs_internal()) md_statfs fails: rc = -5
[10935.038782] Lustre: DEBUG MARKER: == replay-single test 21: |X| open(O_CREAT), unlink touch &lt;span class=&quot;code-keyword&quot;&gt;new&lt;/span&gt;, replay, close (test mds_cleanup_orphans) == 06:04:11 (1349777051)
[10935.209519] Turning device loop0 (0x700000) read-only
[10935.233110] Lustre: DEBUG MARKER: mds1 REPLAY BARRIER on lustre-MDT0000
[10935.239897] Lustre: DEBUG MARKER: local REPLAY BARRIER on lustre-MDT0000
[10935.555060] Removing read-only on unknown block (0x700000)
[10945.911054] LDISKFS-fs (loop0): recovery complete
[10945.912650] LDISKFS-fs (loop0): mounted filesystem with ordered data mode. quota=on. Opts: 
[10945.944018] LustreError: 11387:0:(llog_osd.c:579:llog_osd_next_block()) ASSERTION( last_rec-&amp;gt;lrh_index == tail-&amp;gt;lrt_index ) failed: 
[10945.944868] LustreError: 11387:0:(llog_osd.c:579:llog_osd_next_block()) LBUG
[10945.945387] Pid: 11387, comm: ll_mgs_0001
[10945.945389] 
[10945.945389] Call Trace:
[10945.945410]  [&amp;lt;ffffffffa0c24915&amp;gt;] libcfs_debug_dumpstack+0x55/0x80 [libcfs]
[10945.945424]  [&amp;lt;ffffffffa0c24f27&amp;gt;] lbug_with_loc+0x47/0xb0 [libcfs]
[10945.945469]  [&amp;lt;ffffffffa1124af5&amp;gt;] llog_osd_next_block+0xa55/0xa60 [obdclass]
[10945.945521]  [&amp;lt;ffffffffa1288dc6&amp;gt;] ? lustre_pack_reply_flags+0xb6/0x210 [ptlrpc]
[10945.945542]  [&amp;lt;ffffffffa12a542c&amp;gt;] llog_origin_handle_next_block+0x55c/0x780 [ptlrpc]
[10945.945549]  [&amp;lt;ffffffffa066ef73&amp;gt;] mgs_handle+0xb13/0x11e0 [mgs]
[10945.945557]  [&amp;lt;ffffffffa0c356d1&amp;gt;] ? libcfs_debug_msg+0x41/0x50 [libcfs]
[10945.945576]  [&amp;lt;ffffffffa1297853&amp;gt;] ptlrpc_server_handle_request+0x463/0xe70 [ptlrpc]
[10945.945587]  [&amp;lt;ffffffffa0c2566e&amp;gt;] ? cfs_timer_arm+0xe/0x10 [libcfs]
[10945.945614]  [&amp;lt;ffffffffa1290541&amp;gt;] ? ptlrpc_wait_event+0xb1/0x2a0 [ptlrpc]
[10945.945619]  [&amp;lt;ffffffff81051f73&amp;gt;] ? __wake_up+0x53/0x70
[10945.945646]  [&amp;lt;ffffffffa129a3ea&amp;gt;] ptlrpc_main+0xb9a/0x1960 [ptlrpc]
[10945.945673]  [&amp;lt;ffffffffa1299850&amp;gt;] ? ptlrpc_main+0x0/0x1960 [ptlrpc]
[10945.945676]  [&amp;lt;ffffffff8100c14a&amp;gt;] child_rip+0xa/0x20
[10945.945702]  [&amp;lt;ffffffffa1299850&amp;gt;] ? ptlrpc_main+0x0/0x1960 [ptlrpc]
[10945.945744]  [&amp;lt;ffffffffa1299850&amp;gt;] ? ptlrpc_main+0x0/0x1960 [ptlrpc]
[10945.945748]  [&amp;lt;ffffffff8100c140&amp;gt;] ? child_rip+0x0/0x20
[10945.945749] 
[10945.948136] Kernel panic - not syncing: LBUG
[10945.948138] Pid: 11387, comm: ll_mgs_0001 Not tainted 2.6.32-debug #6
[10945.948139] Call Trace:
[10945.948146]  [&amp;lt;ffffffff814f75e4&amp;gt;] ? panic+0xa0/0x168
[10945.948155]  [&amp;lt;ffffffffa0c24f7b&amp;gt;] ? lbug_with_loc+0x9b/0xb0 [libcfs]
[10945.948198]  [&amp;lt;ffffffffa1124af5&amp;gt;] ? llog_osd_next_block+0xa55/0xa60 [obdclass]
[10945.948242]  [&amp;lt;ffffffffa1288dc6&amp;gt;] ? lustre_pack_reply_flags+0xb6/0x210 [ptlrpc]
[10945.948285]  [&amp;lt;ffffffffa12a542c&amp;gt;] ? llog_origin_handle_next_block+0x55c/0x780 [ptlrpc]
[10945.948296]  [&amp;lt;ffffffffa066ef73&amp;gt;] ? mgs_handle+0xb13/0x11e0 [mgs]
[10945.948312]  [&amp;lt;ffffffffa0c356d1&amp;gt;] ? libcfs_debug_msg+0x41/0x50 [libcfs]
[10945.948354]  [&amp;lt;ffffffffa1297853&amp;gt;] ? ptlrpc_server_handle_request+0x463/0xe70 [ptlrpc]
[10945.948368]  [&amp;lt;ffffffffa0c2566e&amp;gt;] ? cfs_timer_arm+0xe/0x10 [libcfs]
[10945.948409]  [&amp;lt;ffffffffa1290541&amp;gt;] ? ptlrpc_wait_event+0xb1/0x2a0 [ptlrpc]
[10945.948413]  [&amp;lt;ffffffff81051f73&amp;gt;] ? __wake_up+0x53/0x70
[10945.948452]  [&amp;lt;ffffffffa129a3ea&amp;gt;] ? ptlrpc_main+0xb9a/0x1960 [ptlrpc]
[10945.948492]  [&amp;lt;ffffffffa1299850&amp;gt;] ? ptlrpc_main+0x0/0x1960 [ptlrpc]
[10945.948496]  [&amp;lt;ffffffff8100c14a&amp;gt;] ? child_rip+0xa/0x20
[10945.948540]  [&amp;lt;ffffffffa1299850&amp;gt;] ? ptlrpc_main+0x0/0x1960 [ptlrpc]
[10945.948620]  [&amp;lt;ffffffffa1299850&amp;gt;] ? ptlrpc_main+0x0/0x1960 [ptlrpc]
[10945.948624]  [&amp;lt;ffffffff8100c140&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="46308" author="tappro" created="Wed, 10 Oct 2012 03:50:36 +0000"  >&lt;p&gt;I&apos;ve added debug to get more information about this issue:&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/#change,4240&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,4240&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Oleg, please use it if you can reproduce this bug&lt;/p&gt;</comment>
                            <comment id="46582" author="green" created="Mon, 15 Oct 2012 12:31:09 +0000"  >&lt;p&gt;Just reproduced&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[49201.778332] Lustre: DEBUG MARKER: == replay-single test 40: cause recovery in ptlrpc, ensure IO continues == 12:28:41 (1350318521)
[49201.795828] Lustre: DEBUG MARKER: multiop /mnt/lustre/f.replay-single.40 OS_c
[49214.016506] LDISKFS-fs (loop0): mounted filesystem with ordered data mode. quota=on. Opts: 
[49214.071707] LustreError: 2626:0:(llog_osd.c:588:llog_osd_next_block()) ASSERTION( last_rec-&amp;gt;lrh_index == tail-&amp;gt;lrt_index ) failed: Rec idx 0, tail idx -30720 in llog #0x2#0x1#00000000 offset 92312, len 2200
[49214.072538] LustreError: 2626:0:(llog_osd.c:588:llog_osd_next_block()) LBUG
[49214.072817] Pid: 2626, comm: ll_mgs_0001
[49214.073065] 
[49214.073065] Call Trace:
[49214.073473]  [&amp;lt;ffffffffa0b34915&amp;gt;] libcfs_debug_dumpstack+0x55/0x80 [libcfs]
[49214.073788]  [&amp;lt;ffffffffa0b34f27&amp;gt;] lbug_with_loc+0x47/0xb0 [libcfs]
[49214.074118]  [&amp;lt;ffffffffa0ecf5f9&amp;gt;] llog_osd_next_block+0xa89/0xa90 [obdclass]
[49214.074455]  [&amp;lt;ffffffffa1092a96&amp;gt;] ? lustre_pack_reply_flags+0xb6/0x210 [ptlrpc]
[49214.074931]  [&amp;lt;ffffffffa10af05c&amp;gt;] llog_origin_handle_next_block+0x55c/0x780 [ptlrpc]
[49214.075406]  [&amp;lt;ffffffffa06bef73&amp;gt;] mgs_handle+0xb13/0x11e0 [mgs]
[49214.075679]  [&amp;lt;ffffffffa0b456d1&amp;gt;] ? libcfs_debug_msg+0x41/0x50 [libcfs]
[49214.075980]  [&amp;lt;ffffffffa10a1483&amp;gt;] ptlrpc_server_handle_request+0x463/0xe70 [ptlrpc]
[49214.076443]  [&amp;lt;ffffffffa0b3566e&amp;gt;] ? cfs_timer_arm+0xe/0x10 [libcfs]
[49214.076736]  [&amp;lt;ffffffffa109a171&amp;gt;] ? ptlrpc_wait_event+0xb1/0x2a0 [ptlrpc]
[49214.077051]  [&amp;lt;ffffffff81051f73&amp;gt;] ? __wake_up+0x53/0x70
[49214.077330]  [&amp;lt;ffffffffa10a401a&amp;gt;] ptlrpc_main+0xb9a/0x1960 [ptlrpc]
[49214.077710]  [&amp;lt;ffffffffa10a3480&amp;gt;] ? ptlrpc_main+0x0/0x1960 [ptlrpc]
[49214.077993]  [&amp;lt;ffffffff8100c14a&amp;gt;] child_rip+0xa/0x20
[49214.078267]  [&amp;lt;ffffffffa10a3480&amp;gt;] ? ptlrpc_main+0x0/0x1960 [ptlrpc]
[49214.078583]  [&amp;lt;ffffffffa10a3480&amp;gt;] ? ptlrpc_main+0x0/0x1960 [ptlrpc]
[49214.078860]  [&amp;lt;ffffffff8100c140&amp;gt;] ? child_rip+0x0/0x20

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="46672" author="tappro" created="Wed, 17 Oct 2012 09:44:40 +0000"  >&lt;p&gt;As I suspected, the llog contains partially written records. This must be the result of llog_osd_write_blob() being called with a buffer to write. In that case there are actually 3 separate writes - record header, buffer and record tail. So we can have the first write completed but not the others, which causes the assertion upon read. &lt;/p&gt;
</comment>
                            <comment id="46739" author="tappro" created="Thu, 18 Oct 2012 12:51:53 +0000"  >&lt;p&gt;A possible solution would be locking, with a write lock around those 3 writes and a read lock in llog_osd_next_block(). Given that the &quot;3 writes&quot; case is not common (used only for config llogs), that shouldn&apos;t cause a lot of contention.&lt;/p&gt;

&lt;p&gt;Meanwhile, I wonder whether we can avoid those &apos;3 writes&apos; altogether by requiring that llog_write not be called with an external buffer but only with a fully prepared llog record. That means the MGS should prepare the llog record by copying the lustre_cfg buffer. Such overhead is not critical for the MGS, and we would avoid that buggy case with 3 separate writes in llog_osd. &lt;/p&gt;</comment>
                            <comment id="46762" author="tappro" created="Fri, 19 Oct 2012 01:31:56 +0000"  >&lt;p&gt;Fix with locking, write lock envelopes problematic multiple writes while dt_read() is protected with read lock.&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/4303&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/4303&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Another, and probably better, way would be to remove those multiple writes and write the llog record only as a single block; that would require more work, but would clean up llog nicely.&lt;/p&gt;</comment>
                            <comment id="47708" author="tappro" created="Mon, 12 Nov 2012 18:53:44 +0000"  >&lt;p&gt;The patch is ready for landing; we need confirmation from Oleg that the bug is not seen anymore.&lt;/p&gt;</comment>
                            <comment id="48116" author="adilger" created="Tue, 20 Nov 2012 14:23:19 +0000"  >&lt;p&gt;Patch landed, closing bug.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzv9uv:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>5131</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>