<!-- 
RSS generated by JIRA (5.2.4#845-sha1:c9f4cc41abe72fb236945343a1f485c2c844dac9) at Wed Jun 19 00:56:37 CDT 2013

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, add field=key&field=summary to the URL of your request:
http://www.couchbase.com/issues/si/jira.issueviews:issue-xml/MB-5298/MB-5298.xml?field=key&field=summary
-->
<rss version="0.92" >
<channel>
    <title>Couchbase</title>
    <link>http://www.couchbase.com/issues</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>5.2.4</version>
        <build-number>845</build-number>
        <build-date>26-12-2012</build-date>
    </build-info>

<item>
            <title>[MB-5298] Rebalance failed with reason {case_clause,{{ok,replica},{ok,replica}}} when rebalancing out a node which was failed over due to network connectivity issues but it re-appears while rebalancing</title>
                <link>http://www.couchbase.com/issues/browse/MB-5298</link>
                <project id="10010" key="MB">Couchbase Server</project>
                        <description>Failing testcase&lt;br/&gt;
failovertests.FailoverTests.test_failover_firewall,replica=3,load_ratio=10&lt;br/&gt;
&lt;br/&gt;
[ns_server:info] [2012-05-14 13:26:46] [&lt;a href=&apos;mailto:ns_1@10.1.3.55&apos;&gt;ns_1@10.1.3.55&lt;/a&gt;:&amp;lt;0.3846.2&amp;gt;:ns_janitor:wait_for_memcached:286] Waiting for &amp;quot;default&amp;quot; on [&amp;#39;&lt;a href=&apos;mailto:ns_1@10.1.3.50&apos;&gt;ns_1@10.1.3.50&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.1.3.51&apos;&gt;ns_1@10.1.3.51&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.1.3.52&apos;&gt;ns_1@10.1.3.52&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.1.3.54&apos;&gt;ns_1@10.1.3.54&lt;/a&gt;&amp;#39;]&lt;br/&gt;
[ns_server:debug] [2012-05-14 13:26:46] [&lt;a href=&apos;mailto:ns_1@10.1.3.55&apos;&gt;ns_1@10.1.3.55&lt;/a&gt;:ns_bucket_worker:ns_bucket_sup:update_childs:91] Stopping child for dead bucket: {{per_bucket_sup,&amp;quot;default&amp;quot;},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;0.23773.0&amp;gt;,supervisor,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;[single_bucket_sup]}&lt;br/&gt;
&lt;br/&gt;
[ns_server:debug] [2012-05-14 13:26:46] [&lt;a href=&apos;mailto:ns_1@10.1.3.55&apos;&gt;ns_1@10.1.3.55&lt;/a&gt;:&amp;lt;0.23773.0&amp;gt;:single_bucket_sup:top_loop:28] Delegating exit {&amp;#39;EXIT&amp;#39;,&amp;lt;0.23699.0&amp;gt;,shutdown} to child supervisor: &amp;lt;0.23774.0&amp;gt;&lt;br/&gt;
&lt;br/&gt;
&lt;br/&gt;
[error_logger:error] [2012-05-14 13:26:03] [&lt;a href=&apos;mailto:ns_1@10.1.3.50&apos;&gt;ns_1@10.1.3.50&lt;/a&gt;:error_logger:ale_error_logger_handler:log_report:72]&lt;br/&gt;
=========================CRASH REPORT=========================&lt;br/&gt;
&amp;nbsp;&amp;nbsp;crasher:&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;initial call: ns_vbucket_mover:init/1&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;pid: &amp;lt;0.29733.2&amp;gt;&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;registered_name: []&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;exception exit: {case_clause,{{ok,replica},{ok,replica}}}&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;in function  gen_server:terminate/6&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;ancestors: [&amp;lt;0.28176.2&amp;gt;]&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;messages: [{&amp;#39;EXIT&amp;#39;,&amp;lt;0.19829.3&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{exited,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{&amp;#39;EXIT&amp;#39;,&amp;lt;0.29733.2&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{case_clause,{{ok,replica},{ok,replica}}}}}},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{&amp;#39;EXIT&amp;#39;,&amp;lt;0.19792.3&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{exited,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{&amp;#39;EXIT&amp;#39;,&amp;lt;0.29733.2&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{case_clause,{{ok,replica},{ok,replica}}}}}},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{&amp;#39;EXIT&amp;#39;,&amp;lt;0.15598.3&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{exited,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{&amp;#39;EXIT&amp;#39;,&amp;lt;0.29733.2&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{case_clause,{{ok,replica},{ok,replica}}}}}}]</description>
                <environment>1.8.1-815-rel</environment>
            <key id="17060">MB-5298</key>
            <summary>Rebalance failed with reason {case_clause,{{ok,replica},{ok,replica}}} when rebalancing out a node which was failed over due to network connectivity issues but it re-appears while rebalancing</summary>
                <type id="1" iconUrl="http://www.couchbase.com/issues/images/icons/issuetypes/bug.png">Bug</type>
                                <priority id="2" iconUrl="http://www.couchbase.com/issues/images/icons/priorities/critical.png">Critical</priority>
                    <status id="6" iconUrl="http://www.couchbase.com/issues/images/icons/statuses/closed.png">Closed</status>
                    <resolution id="1">Fixed</resolution>
                    <security id="10011">Public</security>
                        <assignee username="alkondratenko">Aleksey Kondratenko</assignee>
                                <reporter username="karan">Karan Kumar</reporter>
                        <labels>
                        <label>1.8.1-release-notes</label>
                    </labels>
                <created>Mon, 14 May 2012 15:34:40 -0500</created>
                <updated>Wed, 9 Jan 2013 23:13:18 -0600</updated>
                    <resolved>Mon, 17 Sep 2012 13:25:20 -0500</resolved>
                            <version>1.8.1-release-candidate</version>
                                <fixVersion>2.0</fixVersion>
                                <component>ns_server</component>
                                <votes>0</votes>
                        <watches>2</watches>
                                                    <comments>
                    <comment id="27229" author="alkondratenko" created="Mon, 14 May 2012 22:52:30 -0500"  >I&amp;#39;ve added more logging in affected area(s). Please retest with latest stuff</comment>
                    <comment id="27723" author="karan" created="Tue, 22 May 2012 00:01:46 -0500"  >Adding the latest logs from 181-832-rel</comment>
                    <comment id="27724" author="karan" created="Tue, 22 May 2012 00:03:40 -0500"  >Failing test:-&lt;br/&gt;
failovertests.FailoverTests.test_failover_firewall,replica=3,load_ratio=10</comment>
                    <comment id="27860" author="alkondratenko" created="Wed, 23 May 2012 12:24:39 -0500"  >Good find. Now we have evidence that one of previously firewalled and failed over nodes is being (seemingly gradually) un-firewalled in the middle of rebalance. When rest of cluster actually already ejected this node. But this node discovers it was ejected 1 minute after it&amp;#39;s replicator was able to push-replicate to one of existing nodes. We&amp;#39;re starting to really hit limits of our naive cluster orchestration approach.&lt;br/&gt;
</comment>
                    <comment id="27861" author="alkondratenko" created="Wed, 23 May 2012 12:25:42 -0500"  >I think reasonably simple treatment (still partial and naive) is to never restart replication automatically until janitor restarts it. It has some potential data safety implications though. I.e. janitor being really conservative in some cases will not restart replications that previously were automagically restarted. So not sure.</comment>
                    <comment id="27862" author="alkondratenko" created="Wed, 23 May 2012 12:27:31 -0500"  >Pull-based replication which is part of branch-18 would help here as well. Sadly we were not allowed to have it on branch-181.</comment>
                    <comment id="27863" author="alkondratenko" created="Wed, 23 May 2012 12:27:40 -0500"  >Need PM decision here</comment>
                    <comment id="27934" author="alkondratenko" created="Thu, 24 May 2012 12:48:09 -0500"  >May I ask for testing if this is a regression? My understanding no it&amp;#39;s not.</comment>
                    <comment id="27941" author="farshid" created="Thu, 24 May 2012 13:03:54 -0500"  >should we run this against 1.8.0 ?</comment>
                    <comment id="27943" author="alkondratenko" created="Thu, 24 May 2012 13:48:53 -0500"  >If you can, please do. I&amp;#39;m pretty sure you&amp;#39;ll hit this in 1.8.0 because failover &amp;amp; replication logic (hint: no quick failover was allowed for 1.8.1) is same.</comment>
                    <comment id="28228" author="karan" created="Tue, 29 May 2012 20:27:03 -0500"  >We are pretty much hitting this consistently on 181. &lt;br/&gt;
&lt;br/&gt;
</comment>
                    <comment id="28230" author="alkondratenko" created="Tue, 29 May 2012 20:28:45 -0500"  >Just stop doing this questionable practice of abusing firewall.</comment>
                    <comment id="28231" author="dipti" created="Tue, 29 May 2012 20:29:46 -0500"  >What are our options here to fix this on 181? Given that the likelihood of hitting this is higher, we should try to fix it. </comment>
                    <comment id="28234" author="alkondratenko" created="Tue, 29 May 2012 20:35:43 -0500"  >My understanding is that the probability of hitting this in practice approaches zero. We have had this issue since 1.6.0, yet nobody has reported this problem.</comment>
                    <comment id="28235" author="farshid" created="Tue, 29 May 2012 20:37:32 -0500"  >This is not about abusing the firewall. It is about a node coming back up or re-appearing after it has failed over.&lt;br/&gt;
&lt;br/&gt;
if this is purely due to firewall then its ok to defer this</comment>
                    <comment id="28246" author="alkondratenko" created="Tue, 29 May 2012 20:45:16 -0500"  >your specific way of using firewall makes this problem probable to observe. That&amp;#39;s my understanding.</comment>
                    <comment id="28248" author="farshid" created="Tue, 29 May 2012 20:56:35 -0500"  >firewall is our way of simulating a node disappearing and re-appearing. we can simulate that by also shutting down the network interface or pulling the network cable if it helps</comment>
                    <comment id="28249" author="alkondratenko" created="Tue, 29 May 2012 21:03:51 -0500"  >I have evidence that you&amp;#39;re enabling firewall back in some very specific way. Particularly memcached traffic is re-enabled first. And then _minutes_ later you re-enable erlang traffic.</comment>
                    <comment id="28354" author="dipti" created="Wed, 30 May 2012 19:22:07 -0500"  >will defer to later release. </comment>
                    <comment id="39183" author="alkondratenko" created="Mon, 17 Sep 2012 13:25:20 -0500"  >Cannot happen on replicator on destination.</comment>
                </comments>
                    <attachments>
                    <attachment id="13209" name="c25ab549-07a1-4980-a8db-c2d0e5d293f1-10.1.3.50-diag.txt.gz" size="4901004" author="karan" created="Mon, 14 May 2012 15:34:40 -0500" />
                    <attachment id="13210" name="c25ab549-07a1-4980-a8db-c2d0e5d293f1-10.1.3.51-diag.txt.gz" size="3633181" author="karan" created="Mon, 14 May 2012 15:34:40 -0500" />
                    <attachment id="13211" name="c25ab549-07a1-4980-a8db-c2d0e5d293f1-10.1.3.52-diag.txt.gz" size="1241363" author="karan" created="Mon, 14 May 2012 15:34:40 -0500" />
                    <attachment id="13212" name="c25ab549-07a1-4980-a8db-c2d0e5d293f1-10.1.3.53-diag.txt.gz" size="3475074" author="karan" created="Mon, 14 May 2012 15:34:40 -0500" />
                    <attachment id="13213" name="c25ab549-07a1-4980-a8db-c2d0e5d293f1-10.1.3.54-diag.txt.gz" size="1265921" author="karan" created="Mon, 14 May 2012 15:34:40 -0500" />
                    <attachment id="13214" name="c25ab549-07a1-4980-a8db-c2d0e5d293f1-10.1.3.55-diag.txt.gz" size="1265091" author="karan" created="Mon, 14 May 2012 15:34:40 -0500" />
                    <attachment id="13208" name="c25ab549-07a1-4980-a8db-c2d0e5d293f1-10.1.3.56-diag.txt.gz" size="3516533" author="karan" created="Mon, 14 May 2012 15:34:40 -0500" />
                    <attachment id="13315" name="d7d06fcc-8859-47f3-b307-70cc957336a2-10.1.3.50-diag.gz" size="695999" author="karan" created="Tue, 22 May 2012 00:03:40 -0500" />
                    <attachment id="13321" name="d7d06fcc-8859-47f3-b307-70cc957336a2-10.1.3.51-diag.gz" size="487149" author="karan" created="Tue, 22 May 2012 00:03:40 -0500" />
                    <attachment id="13319" name="d7d06fcc-8859-47f3-b307-70cc957336a2-10.1.3.52-diag.gz" size="379092" author="karan" created="Tue, 22 May 2012 00:03:40 -0500" />
                    <attachment id="13320" name="d7d06fcc-8859-47f3-b307-70cc957336a2-10.1.3.53-diag.gz" size="485960" author="karan" created="Tue, 22 May 2012 00:03:40 -0500" />
                    <attachment id="13318" name="d7d06fcc-8859-47f3-b307-70cc957336a2-10.1.3.54-diag.gz" size="504312" author="karan" created="Tue, 22 May 2012 00:03:40 -0500" />
                    <attachment id="13317" name="d7d06fcc-8859-47f3-b307-70cc957336a2-10.1.3.55-diag.gz" size="377549" author="karan" created="Tue, 22 May 2012 00:03:40 -0500" />
                    <attachment id="13316" name="d7d06fcc-8859-47f3-b307-70cc957336a2-10.1.3.56-diag.gz" size="488920" author="karan" created="Tue, 22 May 2012 00:03:40 -0500" />
                </attachments>
            <subtasks>
        </subtasks>
                <customfields>
                                                                        <customfield id="customfield_10180" key="com.atlassian.jira.ext.charting:firstresponsedate">
                <customfieldname>Date of First Response</customfieldname>
                <customfieldvalues>
                    <customfieldvalue>Mon, 14 May 2012 22:52:30 -0500</customfieldvalue>

                </customfieldvalues>
            </customfield>
                                                                                                                                                                                                            <customfield id="customfield_10081" key="com.pyxis.greenhopper.jira:gh-global-rank">
                <customfieldname>Rank</customfieldname>
                <customfieldvalues>
                    <customfieldvalue>5376</customfieldvalue>
                </customfieldvalues>
            </customfield>
                                                                                                                                                                                        <customfield id="customfield_10181" key="com.atlassian.jira.ext.charting:timeinstatus">
                <customfieldname>Time In Status</customfieldname>
                <customfieldvalues>
                    
                </customfieldvalues>
            </customfield>
                                                                    </customfields>
    </item>
</channel>
</rss>