<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:13:33 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1105] file creation fails with Input/Output error due to MDT - OST reconnections</title>
                <link>https://jira.whamcloud.com/browse/LU-1105</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;After creating hundreds of files, the creation fails with &quot;Input/Output error&quot;.&lt;/p&gt;

&lt;p&gt;Here is an extract from MDS log.&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00000100:02020000:5.0:1329310922.993555:0:3101:0:(client.c:1125:ptlrpc_check_status()) 11-0: an error occurred while communicating with 10.17.0.4@o2ib. The ost_connect operation failed with -114
00000100:02020000:5.0:1329310922.993559:0:3101:0:(client.c:1125:ptlrpc_check_status()) 11-0: an error occurred while communicating with 10.17.0.3@o2ib. The ost_connect operation failed with -114
00000100:02020000:5.0:1329310922.993563:0:3101:0:(client.c:1125:ptlrpc_check_status()) 11-0: an error occurred while communicating with 10.17.0.4@o2ib. The ost_connect operation failed with -114
00000100:02020000:5.0:1329310922.993566:0:3101:0:(client.c:1125:ptlrpc_check_status()) 11-0: an error occurred while communicating with 10.17.0.3@o2ib. The ost_connect operation failed with -114
00000100:02020000:5.0:1329310922.993589:0:3101:0:(client.c:1125:ptlrpc_check_status()) 11-0: an error occurred while communicating with 10.17.0.3@o2ib. The ost_connect operation failed with -114
00000100:02020000:5.0:1329310922.993592:0:3101:0:(client.c:1125:ptlrpc_check_status()) 11-0: an error occurred while communicating with 10.17.0.3@o2ib. The ost_connect operation failed with -114
00000100:02020000:5.0:1329310922.993595:0:3101:0:(client.c:1125:ptlrpc_check_status()) 11-0: an error occurred while communicating with 10.17.0.3@o2ib. The ost_connect operation failed with -114
00020000:00020000:7.0F:1329310937.993023:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 8/30: rc = -11
00020000:00020000:7.0:1329310937.993032:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 15/30: rc = -11
00020000:00020000:7.0:1329310937.993035:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 16/30: rc = -11
00020000:00020000:7.0:1329310937.993037:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 25/30: rc = -11
00020000:00020000:7.0:1329310937.993040:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 12/30: rc = -11
00020000:00020000:7.0:1329310937.993042:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 9/30: rc = -11
00020000:00020000:7.0:1329310937.993044:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 5/30: rc = -11
00020000:00020000:7.0:1329310937.993046:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 19/30: rc = -11
00020000:00020000:7.0:1329310937.993049:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 21/30: rc = -11
00020000:00020000:7.0:1329310937.993051:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 28/30: rc = -11
00020000:00020000:7.0:1329310937.993053:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 4/30: rc = -11
00020000:00020000:7.0:1329310937.993055:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 27/30: rc = -11
00020000:00020000:7.0:1329310937.993057:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 22/30: rc = -11
00020000:00020000:7.0:1329310937.993060:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 0/30: rc = -11
00020000:00020000:7.0:1329310937.993062:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 11/30: rc = -11
00020000:00020000:7.0:1329310937.993064:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 20/30: rc = -11
00020000:00020000:7.0:1329310937.993066:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 7/30: rc = -11
00020000:00020000:7.0:1329310937.993068:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 26/30: rc = -11
00020000:00020000:7.0:1329310937.993071:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 23/30: rc = -11
00020000:00020000:7.0:1329310937.993073:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 13/30: rc = -11
00020000:00020000:7.0:1329310937.993075:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 2/30: rc = -11
00020000:00020000:7.0:1329310937.993077:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 24/30: rc = -11
00020000:00020000:7.0:1329310937.993080:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 6/30: rc = -11
00020000:00020000:7.0:1329310937.993082:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 14/30: rc = -11
00020000:00020000:7.0:1329310937.993084:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 10/30: rc = -11
00020000:00020000:7.0:1329310937.993086:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 18/30: rc = -11
00020000:00020000:7.0:1329310937.993090:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 3/30: rc = -11
00020000:00020000:7.0:1329310937.993100:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 17/30: rc = -11
00020000:00020000:7.0:1329310937.993103:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 29/30: rc = -11
00020000:00020000:7.0:1329310937.993109:0:3100:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 1/30: rc = -11
00020000:00020000:3.0F:1329310937.993138:0:3354:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 7/30: rc = -5
00020000:00020000:3.0:1329310937.993151:0:3354:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 14/30: rc = -5
00020000:00020000:3.0:1329310937.993158:0:3354:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 15/30: rc = -5
00020000:00020000:3.0:1329310937.993164:0:3354:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 24/30: rc = -5
00020000:00020000:3.0:1329310937.993171:0:3354:0:(lov_request.c:569:lov_update_create_set()) error creating fid 0x6a39 sub-object on OST idx 11/30: rc = -5
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Here is an extract from OSS log:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00010000:00020000:3.0F:1329310843.814130:0:15034:0:(ldlm_lib.c:620:target_handle_reconnect()) scratch-MDT0000-mdtlov_UUID reconnecting from NET_0x500000a110002_UUID, handle mismatch (ours 0x1d014c26baadc6f4, theirs 0x561e1655a7ff215f)
00010000:00020000:3.0:1329310843.814139:0:15034:0:(ldlm_lib.c:2129:target_send_reply_msg()) @@@ processing error (-114)  req@ffff88057cd77000 x1393874236755056/t0(0) o-1-&amp;gt;&amp;lt;?&amp;gt;@&amp;lt;?&amp;gt;:0/0 lens 368/264 e 0 to 0 dl 1329310943 ref 1 fl Interpret:/ffffffff/ffffffff rc -114/-1
00010000:00020000:3.0:1329310843.814178:0:15034:0:(ldlm_lib.c:620:target_handle_reconnect()) scratch-MDT0000-mdtlov_UUID reconnecting from NET_0x500000a110002_UUID, handle mismatch (ours 0x1d014c26baadc733, theirs 0x561e1655a7ff2189)
00010000:00020000:7.0F:1329310843.814181:0:15008:0:(ldlm_lib.c:620:target_handle_reconnect()) scratch-MDT0000-mdtlov_UUID reconnecting from NET_0x500000a110002_UUID, handle mismatch (ours 0x1d014c26baadc82f, theirs 0x561e1655a7ff21b3)
00010000:00020000:3.0:1329310843.814181:0:15034:0:(ldlm_lib.c:2129:target_send_reply_msg()) @@@ processing error (-114)  req@ffff88061c7b8000 x1393874236755058/t0(0) o-1-&amp;gt;&amp;lt;?&amp;gt;@&amp;lt;?&amp;gt;:0/0 lens 368/264 e 0 to 0 dl 1329310943 ref 1 fl Interpret:/ffffffff/ffffffff rc -114/-1
00010000:00020000:7.0:1329310843.814187:0:15008:0:(ldlm_lib.c:2129:target_send_reply_msg()) @@@ processing error (-114)  req@ffff8805bd75f400 x1393874236755060/t0(0) o-1-&amp;gt;&amp;lt;?&amp;gt;@&amp;lt;?&amp;gt;:0/0 lens 368/264 e 0 to 0 dl 1329310943 ref 1 fl Interpret:/ffffffff/ffffffff rc -114/-1
00010000:00020000:7.0:1329310843.814211:0:15008:0:(ldlm_lib.c:620:target_handle_reconnect()) scratch-MDT0000-mdtlov_UUID reconnecting from NET_0x500000a110002_UUID, handle mismatch (ours 0x1d014c26baadc8d7, theirs 0x561e1655a7ff221c)
00010000:00020000:3.0:1329310843.814211:0:15034:0:(ldlm_lib.c:620:target_handle_reconnect()) scratch-MDT0000-mdtlov_UUID reconnecting from NET_0x500000a110002_UUID, handle mismatch (ours 0x1d014c26baadc859, theirs 0x561e1655a7ff2207)
00010000:00020000:7.0:1329310843.814215:0:15008:0:(ldlm_lib.c:2129:target_send_reply_msg()) @@@ processing error (-114)  req@ffff8805bd4f8400 x1393874236755065/t0(0) o-1-&amp;gt;&amp;lt;?&amp;gt;@&amp;lt;?&amp;gt;:0/0 lens 368/264 e 0 to 0 dl 1329310943 ref 1 fl Interpret:/ffffffff/ffffffff rc -114/-1
00010000:00020000:4.0F:1329310843.814215:0:15032:0:(ldlm_lib.c:620:target_handle_reconnect()) scratch-MDT0000-mdtlov_UUID reconnecting from NET_0x500000a110002_UUID, handle mismatch (ours 0x1d014c26baadc8c2, theirs 0x561e1655a7ff21dd)
00010000:00020000:3.0:1329310843.814215:0:15034:0:(ldlm_lib.c:2129:target_send_reply_msg()) @@@ processing error (-114)  req@ffff8805cd235850 x1393874236755064/t0(0) o-1-&amp;gt;&amp;lt;?&amp;gt;@&amp;lt;?&amp;gt;:0/0 lens 368/264 e 0 to 0 dl 1329310943 ref 1 fl Interpret:/ffffffff/ffffffff rc -114/-1
00010000:00020000:4.0:1329310843.814222:0:15032:0:(ldlm_lib.c:2129:target_send_reply_msg()) @@@ processing error (-114)  req@ffff8805c0977000 x1393874236755062/t0(0) o-1-&amp;gt;&amp;lt;?&amp;gt;@&amp;lt;?&amp;gt;:0/0 lens 368/264 e 0 to 0 dl 1329310943 ref 1 fl Interpret:/ffffffff/ffffffff rc -114/-1
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
</description>
                <environment>Lustre 2.1 with Bull patches, bullxlinux6.1 x86_64 (based on Redhat 6.1)&lt;br/&gt;
file system formatted with lustre 2.0.</environment>
        <key id="13188">LU-1105</key>
            <summary>file creation fails with Input/Output error due to MDT - OST reconnections</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="bobijam">Zhenyu Xu</assignee>
                                    <reporter username="pichong">Gregoire Pichon</reporter>
                        <labels>
                    </labels>
                <created>Wed, 15 Feb 2012 11:13:32 +0000</created>
                <updated>Mon, 20 Feb 2012 10:12:46 +0000</updated>
                            <resolved>Mon, 20 Feb 2012 10:12:46 +0000</resolved>
                                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="28745" author="pichong" created="Wed, 15 Feb 2012 12:08:10 +0000"  >&lt;p&gt;The file system is made of 2 OSSs with 15 OSTs each. The MGT and the MDT are on the same server.&lt;/p&gt;</comment>
                            <comment id="28789" author="pjones" created="Wed, 15 Feb 2012 15:29:53 +0000"  >&lt;p&gt;Bobi&lt;/p&gt;

&lt;p&gt;Could you please look into this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="28863" author="pichong" created="Thu, 16 Feb 2012 04:09:05 +0000"  >&lt;p&gt;I have uploaded files on the whamcloud ftp server:&lt;br/&gt;
2557929999 15586051 dk_all_CLIENT&lt;br/&gt;
3591178222 34920242 dk_all_MDS&lt;br/&gt;
3346219849 24249412 dk_all_OSS1&lt;br/&gt;
2301728498 23701193 dk_all_OSS2&lt;/p&gt;

&lt;p&gt;They contain the lctl dk logs of the filesystem with much more history.&lt;/p&gt;

&lt;p&gt;The MDS/MGS has address 10.17.0.12@o2ib&lt;br/&gt;
The OSSs have addresses 10.17.0.3@o2ib and 10.17.0.4@o2ib&lt;/p&gt;

&lt;p&gt;Hope this helps.&lt;br/&gt;
Gr&#233;goire.&lt;/p&gt;</comment>
                            <comment id="28890" author="bobijam" created="Thu, 16 Feb 2012 09:54:04 +0000"  >&lt;p&gt;From OSS logs&lt;/p&gt;
&lt;blockquote&gt;
&lt;p&gt;target_handle_connect()) scratch-OST000b: received MDS connection from NID 10.17.0.2@o2ib, removing former export from NID 10.17.0.12@o2ib&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;During file creations, the MDS switched its connection NID from 10.17.0.12@o2ib to 10.17.0.2@o2ib, which caused all the object create requests from the old MDS export to fail. Do you know what happened to the MDS network?&lt;/p&gt;</comment>
                            <comment id="29475" author="pichong" created="Mon, 20 Feb 2012 05:21:31 +0000"  >&lt;p&gt;The problem comes from a wrong configuration of our filesystem: there are several MGS in the cluster.&lt;br/&gt;
Sorry for this fake problem.&lt;br/&gt;
The ticket can be closed.&lt;/p&gt;</comment>
                            <comment id="29478" author="pjones" created="Mon, 20 Feb 2012 10:12:46 +0000"  >&lt;p&gt;ok thanks Gregoire!&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="10836" name="dk_MDS" size="42757" author="pichong" created="Wed, 15 Feb 2012 12:08:10 +0000"/>
                            <attachment id="10837" name="dk_OSS1" size="22598" author="pichong" created="Wed, 15 Feb 2012 12:08:10 +0000"/>
                            <attachment id="10838" name="dk_OSS2" size="21518" author="pichong" created="Wed, 15 Feb 2012 12:08:10 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvhbz:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>6457</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>