<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:21:59 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-2056] SWL - osd_trans_start()) ASSERTION( oti-&gt;oti_w_locks == 0 ) failed:</title>
                <link>https://jira.whamcloud.com/browse/LU-2056</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;&amp;lt;ConMan&amp;gt; Console [hyperion-rst6] log at 2012-09-30 16:00:00 PDT.
2012-09-30 16:20:23 Lustre: 4162:0:(client.c:1917:ptlrpc_expire_one_request()) @@@ Request  sent has timed out &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; slow reply: [sent 1349048656/real 1349048656]  req@ffff880176df8c00 x1414547178955781/t0(0) o400-&amp;gt;MGC192.168.127.6@o2ib@0@lo:26/25 lens 224/224 e 0 to 1 dl 1349048762 ref 1 fl Rpc:RXN/0/ffffffff rc 0/-1
2012-09-30 16:46:02 LustreError: 166-1: MGC192.168.127.6@o2ib: Connection to MGS (at 0@lo) was lost; in progress operations using &lt;span class=&quot;code-keyword&quot;&gt;this&lt;/span&gt; service will fail
2012-09-30 16:46:02 Lustre: MGS: Client b825c79a-32bd-3ab8-c5fa-b66aeb9bb741 (at 0@lo) reconnecting
2012-09-30 16:46:02 LustreError: 4242:0:(obd_class.h:527:obd_set_info_async()) obd_set_info_async: dev 0 no operation
2012-09-30 16:47:09 Lustre: MGC192.168.127.6@o2ib: Reactivating &lt;span class=&quot;code-keyword&quot;&gt;import&lt;/span&gt;
2012-09-30 16:47:09 Lustre: MGC192.168.127.6@o2ib: Connection restored to MGS (at 0@lo)

&amp;lt;ConMan&amp;gt; Console [hyperion-rst6] log at 2012-09-30 17:00:00 PDT.
2012-09-30 17:02:38 LustreError: 6069:0:(osd_handler.c:837:osd_trans_start()) ASSERTION( oti-&amp;gt;oti_w_locks == 0 ) failed: 

2012-09-30 17:02:38 LustreError: 6069:0:(osd_handler.c:837:osd_trans_start()) LBUG
2012-09-30 17:02:38 Pid: 6069, comm: mdt_rdpg03_002
2012-09-30 17:02:38

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;For some reason, the stack did not dump, but a vmcore was obtained.&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;crash&amp;gt; bt
PID: 6069   TASK: ffff880141836aa0  CPU: 7   COMMAND: &lt;span class=&quot;code-quote&quot;&gt;&quot;mdt_rdpg03_002&quot;&lt;/span&gt;
 #0 [ffff880156e759c8] machine_kexec at ffffffff8103281b
 #1 [ffff880156e75a28] crash_kexec at ffffffff810ba792
 #2 [ffff880156e75af8] panic at ffffffff814fd591
 #3 [ffff880156e75b78] lbug_with_loc at ffffffffa0393f6b [libcfs]
 #4 [ffff880156e75b98] osd_trans_start at ffffffffa0a8d2bc [osd_ldiskfs]
 #5 [ffff880156e75bd8] mdd_trans_start at ffffffffa0f043a4 [mdd]
 #6 [ffff880156e75be8] mdd_close at ffffffffa0edf4f6 [mdd]
 #7 [ffff880156e75c58] cml_close at ffffffffa06baef6 [cmm]
 #8 [ffff880156e75c88] mdt_mfd_close at ffffffffa0f8a18e [mdt]
 #9 [ffff880156e75ce8] mdt_close at ffffffffa0f8ae0a [mdt]
#10 [ffff880156e75d38] mdt_handle_common at ffffffffa0f66802 [mdt]
#11 [ffff880156e75d88] mdt_readpage_handle at ffffffffa0f676d5 [mdt]
#12 [ffff880156e75d98] ptlrpc_server_handle_request at ffffffffa0966b3c [ptlrpc]
#13 [ffff880156e75e98] ptlrpc_main at ffffffffa0968111 [ptlrpc]
#14 [ffff880156e75f48] kernel_thread at ffffffff8100c14a
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>LLNL/Hyperion lustre-reviews 9573</environment>
        <key id="16189">LU-2056</key>
            <summary>SWL - osd_trans_start()) ASSERTION( oti-&gt;oti_w_locks == 0 ) failed:</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="hongchao.zhang">Hongchao Zhang</assignee>
                                    <reporter username="cliffw">Cliff White</reporter>
                        <labels>
                            <label>HB</label>
                    </labels>
                <created>Sun, 30 Sep 2012 21:30:33 +0000</created>
                <updated>Fri, 19 Apr 2013 14:20:21 +0000</updated>
                            <resolved>Mon, 14 Jan 2013 15:21:43 +0000</resolved>
                                    <version>Lustre 2.4.0</version>
                                    <fixVersion>Lustre 2.4.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="45785" author="cliffw" created="Sun, 30 Sep 2012 21:33:52 +0000"  >&lt;p&gt;VMcore is at ~cliffw/lu2056/vmcore-rst6.01Oct on brent&lt;/p&gt;</comment>
                            <comment id="45786" author="cliffw" created="Sun, 30 Sep 2012 21:34:31 +0000"  >&lt;p&gt;vmcore is at ~cliffw/lu2056/vmcore-rst6.01Oct on brent&lt;/p&gt;</comment>
                            <comment id="45793" author="liang" created="Mon, 1 Oct 2012 03:51:46 +0000"  >&lt;p&gt;comment in osd_trans_start()&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;                /*
                 * XXX: current rule is that we first start tx,
                 *      then lock object(s), but we can&apos;t use
                 *      this rule for data (due to locking specifics
                 *      in ldiskfs). also in long-term we&apos;d like to
                 *      use usually-used (locks;tx) ordering. so,
                 *      UGLY thing is that we&apos;ll use one ordering for
                 *      data (ofd) and reverse ordering for metadata
                 *      (mdd). then at some point we&apos;ll fix the latter
                 */
                if (dev-&amp;gt;od_is_md) {
                        LASSERT(oti-&amp;gt;oti_r_locks == 0);
                        LASSERT(oti-&amp;gt;oti_w_locks == 0);
                }

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;But code in mdd_close()&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;             .....
2457         mdd_write_lock(env, mdd_obj, MOR_TGT_CHILD);
2458         if (handle == NULL &amp;amp;&amp;amp; mdd_obj-&amp;gt;mod_count == 1 &amp;amp;&amp;amp;
2459             (mdd_obj-&amp;gt;mod_flags &amp;amp; ORPHAN_OBJ) != 0) {
2460                 mdd_write_unlock(env, mdd_obj);
2461                 goto again;
2462         }
             ......
2503                         if (handle == NULL) {
2504                                 handle = mdd_trans_create(env, mdo2mdd(obj));
2505                                 if (IS_ERR(handle))
2506                                         GOTO(out, rc = PTR_ERR(handle));
2507 
2508                                 rc = mdd_declare_object_kill(env, mdd_obj, ma,
2509                                                              handle);
2510                                 if (rc)
2511                                         GOTO(out, rc);
2512 
2513                                 rc = mdd_declare_changelog_store(env, mdd,
2514                                                                  NULL, handle);
2515                                 if (rc)
2516                                         GOTO(stop, rc);
2517 
2518                                 rc = mdd_trans_start(env, mdo2mdd(obj), handle);

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;We start the transaction &lt;em&gt;after&lt;/em&gt; locking the object, which violates the rule set in osd_trans_start().&lt;/p&gt;</comment>
                            <comment id="45805" author="liang" created="Mon, 1 Oct 2012 12:15:44 +0000"  >&lt;p&gt;I&apos;ve posted a patch for this: &lt;a href=&quot;http://review.whamcloud.com/4145&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/4145&lt;/a&gt; , it&apos;s better to try it after it&apos;s reviewed.&lt;/p&gt;</comment>
                            <comment id="45859" author="liang" created="Tue, 2 Oct 2012 09:39:40 +0000"  >&lt;p&gt;I made some changes for wangdi&apos;s review and rebased the previous patch to 2.3 (the previous one was for master); unfortunately, I lost its history by doing this. The new patch is: &lt;a href=&quot;http://review.whamcloud.com/#change,4152&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,4152&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="46113" author="liang" created="Mon, 8 Oct 2012 00:55:50 +0000"  >&lt;p&gt;The patch landed on 2.3, so it&apos;s no longer a 2.3 blocker, but we still need to fix it for master.&lt;/p&gt;</comment>
                            <comment id="47387" author="hongchao.zhang" created="Mon, 5 Nov 2012 02:54:59 +0000"  >&lt;p&gt;the patch against master is tracked at &lt;a href=&quot;http://review.whamcloud.com/#change,4461&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,4461&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="49092" author="green" created="Tue, 11 Dec 2012 22:37:06 +0000"  >&lt;p&gt;I seem to be hitting this (in form of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2443&quot; title=&quot;osd_object_write_lock()) ASSERTION( obj-&amp;gt;oo_owner != env )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2443&quot;&gt;&lt;del&gt;LU-2443&lt;/del&gt;&lt;/a&gt; during racer shutdown) fairly regularly now, please update the patch.&lt;/p&gt;</comment>
                            <comment id="49247" author="liang" created="Fri, 14 Dec 2012 10:01:58 +0000"  >&lt;p&gt;reassign to hongchao because he ported the patch to master&lt;/p&gt;</comment>
                            <comment id="50341" author="jlevi" created="Fri, 11 Jan 2013 12:27:23 +0000"  >&lt;p&gt;Since change 4461 has landed, can this ticket be closed?&lt;/p&gt;</comment>
                            <comment id="50438" author="jlevi" created="Mon, 14 Jan 2013 15:21:43 +0000"  >&lt;p&gt;All patches are landed so closing ticket. Please reopen if more work is needed.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzv4q7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>4299</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>