<!-- 
RSS generated by JIRA (5.2.4#845-sha1:c9f4cc41abe72fb236945343a1f485c2c844dac9) at Fri May 24 10:44:36 CDT 2013

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary add field=key&field=summary to the URL of your request.
For example:
http://www.couchbase.com/issues/si/jira.issueviews:issue-xml/MB-6706/MB-6706.xml?field=key&field=summary
-->
<rss version="0.92" >
<channel>
    <title>Couchbase</title>
    <link>http://www.couchbase.com/issues</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>5.2.4</version>
        <build-number>845</build-number>
        <build-date>26-12-2012</build-date>
    </build-info>

<item>
            <title>[MB-6706] [system test] rebalance hang when add nodes to cluster</title>
                <link>http://www.couchbase.com/issues/browse/MB-6706</link>
                <project id="10010" key="MB">Couchbase Server</project>
                        <description>Cluster information:&lt;br/&gt;
- 8 centos 6.2 64bit server with 4 cores CPU&lt;br/&gt;
- Each server has 32 GB RAM and 400 GB SSD disk.&lt;br/&gt;
- SSD disk format ext4 on /data&lt;br/&gt;
- Each server has its own drive, no disk sharing with other server.&lt;br/&gt;
- Load 15 million items to both buckets&lt;br/&gt;
- Cluster has 2 buckets, default (11GB) and saslbucket (11GB) with consistent view enabled.  For the 2 buckets, we use only 68% of the total system RAM.&lt;br/&gt;
- Each bucket has one doc and 2 views for each doc (default d1 and saslbucket d11)&lt;br/&gt;
&lt;br/&gt;
* Create cluster with 4 nodes installed couchbase server 2.0.0-1746&lt;br/&gt;
&lt;br/&gt;
10.6.2.37&lt;br/&gt;
10.6.2.38&lt;br/&gt;
10.6.2.39&lt;br/&gt;
10.6.2.40&lt;br/&gt;
&lt;br/&gt;
* Data path /data&lt;br/&gt;
* View path /data &lt;br/&gt;
&lt;br/&gt;
* Add 4 nodes to cluster and rebalance&lt;br/&gt;
10.6.2.42&lt;br/&gt;
10.6.2.43&lt;br/&gt;
10.6.2.44&lt;br/&gt;
10.6.2.45&lt;br/&gt;
&lt;br/&gt;
* rebalance hang&lt;br/&gt;
&lt;br/&gt;
* Link to collect info of all nodes  &lt;a href=&quot;https://s3.amazonaws.com/packages.couchbase/collect_info/orange/2_0_0/201209/8nodes-col-info-1746-reb-hang-20120920.tgz&quot;&gt;https://s3.amazonaws.com/packages.couchbase/collect_info/orange/2_0_0/201209/8nodes-col-info-1746-reb-hang-20120920.tgz&lt;/a&gt;&lt;br/&gt;
&lt;br/&gt;
Link to atop file of all nodes  &lt;a href=&quot;https://s3.amazonaws.com/packages.couchbase/atop-files/orange/201209/atop-8nodes-1746-reb-hang-20120920.tgz&quot;&gt;https://s3.amazonaws.com/packages.couchbase/atop-files/orange/201209/atop-8nodes-1746-reb-hang-20120920.tgz&lt;/a&gt;</description>
                <environment>centos 6.2 64bit build 2.0.0-1746</environment>
            <key id="19856">MB-6706</key>
            <summary>[system test] rebalance hang when add nodes to cluster</summary>
                <type id="1" iconUrl="http://www.couchbase.com/issues/images/icons/issuetypes/bug.png">Bug</type>
                                <priority id="1" iconUrl="http://www.couchbase.com/issues/images/icons/priorities/blocker.png">Blocker</priority>
                    <status id="6" iconUrl="http://www.couchbase.com/issues/images/icons/statuses/closed.png">Closed</status>
                    <resolution id="1">Fixed</resolution>
                    <security id="10011">Public</security>
                        <assignee username="FilipeManana">Filipe Manana</assignee>
                                <reporter username="thuan">Thuan Nguyen</reporter>
                        <labels>
                        <label>system-test</label>
                    </labels>
                <created>Thu, 20 Sep 2012 20:58:58 -0500</created>
                <updated>Thu, 10 Jan 2013 01:21:35 -0600</updated>
                    <resolved>Wed, 3 Oct 2012 13:36:47 -0500</resolved>
                            <version>2.0</version>
                                <fixVersion>2.0</fixVersion>
                                <component>ns_server</component>
                                <votes>0</votes>
                        <watches>0</watches>
                                                    <comments>
                    <comment id="39484" author="thuan" created="Fri, 21 Sep 2012 09:03:07 -0500"  >I think this bug is the same as bug &lt;a href=&quot;http://www.couchbase.com/issues/browse/MB-6707&quot; title=&quot;[system test] rebalance does not stop when click on &amp;quot;Stop Rebalance&amp;quot; button&quot;&gt;&lt;strike&gt;MB-6707&lt;/strike&gt;&lt;/a&gt;</comment>
                    <comment id="39521" author="alkondratenko" created="Mon, 24 Sep 2012 01:46:17 -0500"  >Filipe, there are no crashes and you can see in logs of .38 that we&amp;#39;re waiting for index update (there&amp;#39;s just 1 simple index) and this does not happen.&lt;br/&gt;
&lt;br/&gt;
&lt;br/&gt;
[ns_server:debug,2012-09-20T17:20:30.431,&lt;a href=&apos;mailto:ns_1@10.6.2.38&apos;&gt;ns_1@10.6.2.38&lt;/a&gt;:&amp;lt;0.21339.32&amp;gt;:capi_set_view_manager:do_wait_index_updated:596]References to wait: [#Ref&amp;lt;0.0.309.194865&amp;gt;] (&amp;quot;saslbucket&amp;quot;, 531)&lt;br/&gt;
&lt;br/&gt;
I advise you to take a quick look at source of do_wait_index_updated in capi_set_view_manager. Maybe you will spot something that I&amp;#39;m not doing right.</comment>
                    <comment id="39895" author="thuan" created="Thu, 27 Sep 2012 18:07:51 -0500"  >Hit this bug again in build 2.0.0-1777 with swap rebalance   Add node 44, 45 and remove node 39, 40&lt;br/&gt;
Rebalance hangs after moving some items to the newly added nodes&lt;br/&gt;
&lt;br/&gt;
Cluster information:&lt;br/&gt;
- 8 centos 6.2 64bit server with 4 cores CPU&lt;br/&gt;
- Each server has 32 GB RAM and 400 GB SSD disk.&lt;br/&gt;
- 24.8 GB RAM for couchbase server at each node &lt;br/&gt;
- SSD disk format ext4 on /data&lt;br/&gt;
- Each server has its own SSD drive, no disk sharing with other server.&lt;br/&gt;
- Create cluster with 6 nodes installed couchbase server 2.0.0-1777&lt;br/&gt;
- Cluster has 2 buckets, default (12GB) and saslbucket (12GB).&lt;br/&gt;
- Each bucket has one doc and 2 views for each doc (default d1 and saslbucket d11)&lt;br/&gt;
&lt;br/&gt;
&lt;br/&gt;
10.6.2.37&lt;br/&gt;
10.6.2.38&lt;br/&gt;
10.6.2.39&lt;br/&gt;
10.6.2.40&lt;br/&gt;
10.6.2.42&lt;br/&gt;
10.6.2.43&lt;br/&gt;
&lt;br/&gt;
* Load 18 million items to both bucket. Each key has size from 512 bytes to 1024 bytes &lt;br/&gt;
* Queries all 4 views from 2 docs&lt;br/&gt;
&lt;br/&gt;
&lt;br/&gt;
10.6.2.44&lt;br/&gt;
10.6.2.45&lt;br/&gt;
&lt;br/&gt;
* Data path /data&lt;br/&gt;
* View path /data&lt;br/&gt;
&lt;br/&gt;
Link to collect info of all nodes &lt;a href=&quot;https://s3.amazonaws.com/packages.couchbase/collect_info/orange/2_0_0/201209/8nodes-col-info-1777-swap-reb-hang-20120927-155552.tgz&quot;&gt;https://s3.amazonaws.com/packages.couchbase/collect_info/orange/2_0_0/201209/8nodes-col-info-1777-swap-reb-hang-20120927-155552.tgz&lt;/a&gt;&lt;br/&gt;
&lt;br/&gt;
Link to atop of all nodes  &lt;a href=&quot;https://s3.amazonaws.com/packages.couchbase/atop-files/orange/201209/atop-8nodes-1777-swap-reb-hang-20120927-155750.tgz&quot;&gt;https://s3.amazonaws.com/packages.couchbase/atop-files/orange/201209/atop-8nodes-1777-swap-reb-hang-20120927-155750.tgz&lt;/a&gt;&lt;br/&gt;
&lt;br/&gt;
</comment>
                    <comment id="40151" author="thuan" created="Tue, 2 Oct 2012 13:36:04 -0500"  >Hit this bug again in build 2.0.0-1781 in system test. &lt;br/&gt;
&lt;br/&gt;
* Add 2 nodes: 39 and 40 and rebalance. During rebalance, reboot node 42 and 43. Rebalance failed as expected.&lt;br/&gt;
* After node finished warmup, rebalance again. Rebalance failed with bug &lt;a href=&quot;http://www.couchbase.com/issues/browse/MB-6490&quot; title=&quot;Rebalance failed with reason &amp;quot;Partition 687 not in active nor passive set&amp;quot; in add in node rebalance&quot;&gt;&lt;strike&gt;MB-6490&lt;/strike&gt;&lt;/a&gt; on node 44.&lt;br/&gt;
* Failover node 44 and rebalance.&lt;br/&gt;
* Cluster rebalanced saslbucket first.  Rebalance was done after 17 hrs  &lt;br/&gt;
&lt;br/&gt;
Started rebalancing bucket saslbucket	ns_rebalancer000	&lt;a href=&apos;mailto:ns_1@10.6.2.37&apos;&gt;ns_1@10.6.2.37&lt;/a&gt;	14:44:27 - Mon Oct 1, 2012&lt;br/&gt;
Started rebalancing bucket default	ns_rebalancer000	&lt;a href=&apos;mailto:ns_1@10.6.2.37&apos;&gt;ns_1@10.6.2.37&lt;/a&gt;	08:14:08 - Tue Oct 2, 2012&lt;br/&gt;
&lt;br/&gt;
** Rebalance of default bucket hung around 10:00AM Tue Oct 2, 2012, as shown in the screen capture&lt;br/&gt;
&lt;br/&gt;
&lt;br/&gt;
Cluster information:&lt;br/&gt;
- 8 centos 6.2 64bit server with 4 cores CPU&lt;br/&gt;
- Each server has 32 GB RAM and 400 GB SSD disk.&lt;br/&gt;
- 24.8 GB RAM for couchbase server at each node&lt;br/&gt;
- SSD disk format ext4 on /data&lt;br/&gt;
- Each server has its own SSD drive, no disk sharing with other server.&lt;br/&gt;
- Create cluster with 6 nodes installed couchbase server 2.0.0-1781&lt;br/&gt;
- Cluster has 2 buckets, default (12GB) and saslbucket (12GB).&lt;br/&gt;
- Each bucket has one doc and 2 views for each doc (default d1 and saslbucket d11)&lt;br/&gt;
- Enable consistent view on cluster (by default)&lt;br/&gt;
&lt;br/&gt;
10.6.2.37&lt;br/&gt;
10.6.2.38&lt;br/&gt;
10.6.2.44&lt;br/&gt;
10.6.2.45&lt;br/&gt;
10.6.2.42&lt;br/&gt;
10.6.2.43&lt;br/&gt;
&lt;br/&gt;
* Load 14 million items to each bucket. Each key has size from 512 bytes to 1024 bytes&lt;br/&gt;
* Mutate 14 million items to each bucket with size of each key from 1024 to 1500 bytes&lt;br/&gt;
* Load running about 8K to 10K ops on both buckets&lt;br/&gt;
* Queries all 4 views from 2 docs&lt;br/&gt;
&lt;br/&gt;
&lt;br/&gt;
10.6.2.39&lt;br/&gt;
10.6.2.40&lt;br/&gt;
&lt;br/&gt;
* Data path /data&lt;br/&gt;
* View path /data&lt;br/&gt;
&lt;br/&gt;
Manifest info from build 1781&lt;br/&gt;
&lt;a href=&quot;http://builds.hq.northscale.net/latestbuilds/couchbase-server-enterprise_x86_64_2.0.0-1781-rel.rpm.manifest.xml&quot;&gt;http://builds.hq.northscale.net/latestbuilds/couchbase-server-enterprise_x86_64_2.0.0-1781-rel.rpm.manifest.xml&lt;/a&gt; &lt;br/&gt;
&lt;br/&gt;
Link to collect info of all nodes &lt;a href=&quot;https://s3.amazonaws.com/packages.couchbase/collect_info/orange/2_0_0/201210/8nodes-col-info-1781-rebalance-hang-20121002-114333.tgz&quot;&gt;https://s3.amazonaws.com/packages.couchbase/collect_info/orange/2_0_0/201210/8nodes-col-info-1781-rebalance-hang-20121002-114333.tgz&lt;/a&gt;&lt;br/&gt;
&lt;br/&gt;
Link to tap stats from all nodes  &lt;a href=&quot;https://friendpaste.com/6JqjtMOwZLvmlx5h9fxt6L&quot;&gt;https://friendpaste.com/6JqjtMOwZLvmlx5h9fxt6L&lt;/a&gt;&lt;br/&gt;
</comment>
                    <comment id="40152" author="thuan" created="Tue, 2 Oct 2012 13:37:37 -0500"  >Promote it to blocker since we hit it often in system test.</comment>
                    <comment id="40181" author="thuan" created="Tue, 2 Oct 2012 19:52:35 -0500"  >I killed the loads on the default bucket (which was rebalancing but hung); rebalance started five minutes after all loads stopped.  A few minutes later, I restarted half of the loads on the default bucket, and rebalance continued running. </comment>
                    <comment id="40234" author="thuan" created="Wed, 3 Oct 2012 15:55:30 -0500"  >Integrated in github-couchdb-preview #509 (See [&lt;a href=&quot;http://qa.hq.northscale.net/job/github-couchdb-preview/509/&quot;&gt;http://qa.hq.northscale.net/job/github-couchdb-preview/509/&lt;/a&gt;])&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&lt;a href=&quot;http://www.couchbase.com/issues/browse/MB-6706&quot; title=&quot;[system test] rebalance hang when add nodes to cluster&quot;&gt;&lt;strike&gt;MB-6706&lt;/strike&gt;&lt;/a&gt; Trigger update after defining indexable partitions (Revision 9098ff069968247556da72a2be1bbfd944b1d30e)&lt;br/&gt;
&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;Result = SUCCESS&lt;br/&gt;
pwansch : &lt;br/&gt;
Files : &lt;br/&gt;
* src/couch_set_view/src/couch_set_view_group.erl&lt;br/&gt;
</comment>
                </comments>
                    <attachments>
                    <attachment id="15188" name="ss_2012-09-27_at_4.02.17 PM.png" size="88272" author="thuan" created="Thu, 27 Sep 2012 18:08:23 -0500" />
                    <attachment id="15241" name="ss_2012-10-02_at_11.33.33 AM.png" size="63912" author="thuan" created="Tue, 2 Oct 2012 13:36:31 -0500" />
                </attachments>
            <subtasks>
        </subtasks>
                <customfields>
                                                                        <customfield id="customfield_10180" key="com.atlassian.jira.ext.charting:firstresponsedate">
                <customfieldname>Date of First Response</customfieldname>
                <customfieldvalues>
                    <customfieldvalue>Mon, 24 Sep 2012 01:46:17 -0500</customfieldvalue>

                </customfieldvalues>
            </customfield>
                                                                                                                                                                                                            <customfield id="customfield_10081" key="com.pyxis.greenhopper.jira:gh-global-rank">
                <customfieldname>Rank</customfieldname>
                <customfieldvalues>
                    <customfieldvalue>3923</customfieldvalue>
                </customfieldvalues>
            </customfield>
                                                                                                                                                                                        <customfield id="customfield_10181" key="com.atlassian.jira.ext.charting:timeinstatus">
                <customfieldname>Time In Status</customfieldname>
                <customfieldvalues>
                    
                </customfieldvalues>
            </customfield>
                                                </customfields>
    </item>
</channel>
</rss>