<!-- 
RSS generated by JIRA (5.2.4#845-sha1:c9f4cc41abe72fb236945343a1f485c2c844dac9) at Wed May 22 09:33:51 CDT 2013

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary add field=key&field=summary to the URL of your request.
For example:
http://www.couchbase.com/issues/si/jira.issueviews:issue-xml/MB-6992/MB-6992.xml?field=key&field=summary
-->
<rss version="0.92" >
<channel>
    <title>Couchbase</title>
    <link>http://www.couchbase.com/issues</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>5.2.4</version>
        <build-number>845</build-number>
        <build-date>26-12-2012</build-date>
    </build-info>

<item>
            <title>[MB-6992] rebalance hangs after failing over disconnected node</title>
                <link>http://www.couchbase.com/issues/browse/MB-6992</link>
                <project id="10010" key="MB">Couchbase Server</project>
                        <description>One node went down while loading data on a 22-node cluster (possibly related to the xen hypervisor, as it could not ping the gateway and the network interface needed to be restarted).&lt;br/&gt;
While the node was down, I tried to fail it over and rebalance.&lt;br/&gt;
However, rebalance never completes, and it looks like there is no rebalance activity occurring on tap.&lt;br/&gt;
&lt;br/&gt;
&lt;br/&gt;
Some activity seen in logs at time of node down:&lt;br/&gt;
&lt;br/&gt;
10.3.3.59 sees  .60 nodedown :&lt;br/&gt;
&lt;br/&gt;
[user:warn,2012-10-22T11:06:38.896,&lt;a href=&apos;mailto:ns_1@10.3.3.59&apos;&gt;ns_1@10.3.3.59&lt;/a&gt;:ns_node_disco:ns_node_disco:handle_info:168]Node &amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.59&apos;&gt;ns_1@10.3.3.59&lt;/a&gt;&amp;#39; saw that node &amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.60&apos;&gt;ns_1@10.3.3.60&lt;/a&gt;&amp;#39; went down.&lt;br/&gt;
&lt;br/&gt;
at the same time stamp node .60 shows:&lt;br/&gt;
&lt;br/&gt;
[ns_server:error,2012-10-22T11:06:00.350,&lt;a href=&apos;mailto:ns_1@10.3.3.60&apos;&gt;ns_1@10.3.3.60&lt;/a&gt;:&amp;lt;0.12281.36&amp;gt;:ns_janitor:cleanup_with_states:84]Bucket &amp;quot;default&amp;quot; not yet ready on [&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.84&apos;&gt;ns_1@10.3.2.84&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.85&apos;&gt;ns_1@10.3.2.85&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.110&apos;&gt;ns_1@10.3.2.110&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.111&apos;&gt;ns_1@10.3.2.111&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.112&apos;&gt;ns_1@10.3.2.112&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.113&apos;&gt;ns_1@10.3.2.113&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.114&apos;&gt;ns_1@10.3.2.114&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.115&apos;&gt;ns_1@10.3.2.115&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.59&apos;&gt;ns_1@10.3.3.59&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.62&apos;&gt;ns_1@10.3.3.62&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.66&apos;&gt;ns_1@10.3.3.66&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.69&apos;&gt;ns_1@10.3.3.69&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.70&apos;&gt;ns_1@10.3.3.70&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.121.90&apos;&gt;ns_1@10.3.121.90&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.121.91&apos;&gt;ns_1@10.3.121.91&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.107&apos;&gt;ns_1@10.3.2.107&lt;/a&gt;&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.109&apos;&gt;ns_1@10.3.2.109&lt;/a&gt;&amp;#39;]&lt;br/&gt;
[ns_server:debug,2012-10-22T11:06:07.388,&lt;a href=&apos;mailto:ns_1@10.3.3.60&apos;&gt;ns_1@10.3.3.60&lt;/a&gt;:&amp;lt;0.12508.36&amp;gt;:janitor_agent:new_style_query_vbucket_states_loop:116]Exception from query_vbucket_states of &amp;quot;default&amp;quot;:&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.85&apos;&gt;ns_1@10.3.2.85&lt;/a&gt;&amp;#39;&lt;br/&gt;
{&amp;#39;EXIT&amp;#39;,{{nodedown,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.85&apos;&gt;ns_1@10.3.2.85&lt;/a&gt;&amp;#39;},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{gen_server,call,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;[{&amp;#39;janitor_agent-default&amp;#39;,&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.85&apos;&gt;ns_1@10.3.2.85&lt;/a&gt;&amp;#39;},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;query_vbucket_states,infinity]}}}&lt;br/&gt;
</description>
                <environment>build 10.3.3.59</environment>
            <key id="20384">MB-6992</key>
            <summary>rebalance hangs after failing over disconnected node</summary>
                <type id="1" iconUrl="http://www.couchbase.com/issues/images/icons/issuetypes/bug.png">Bug</type>
                                <priority id="1" iconUrl="http://www.couchbase.com/issues/images/icons/priorities/blocker.png">Blocker</priority>
                    <status id="6" iconUrl="http://www.couchbase.com/issues/images/icons/statuses/closed.png">Closed</status>
                    <resolution id="1">Fixed</resolution>
                    <security id="10011">Public</security>
                        <assignee username="chiyoung">Chiyoung Seo</assignee>
                                <reporter username="tommie">Tommie McAfee</reporter>
                        <labels>
                        <label>system-test</label>
                    </labels>
                <created>Tue, 23 Oct 2012 15:39:58 -0500</created>
                <updated>Thu, 10 Jan 2013 01:55:22 -0600</updated>
                    <resolved>Fri, 26 Oct 2012 19:18:34 -0500</resolved>
                            <version>2.0</version>
                                <fixVersion>2.0</fixVersion>
                                <component>couchbase-bucket</component>
                <component>ns_server</component>
                                <votes>0</votes>
                        <watches>1</watches>
                                                    <comments>
                    <comment id="42321" author="tommie" created="Tue, 23 Oct 2012 16:14:48 -0500"  >Also, when Jin took a look he noticed most nodes are at 100% rebalance status; however, 10.3.2.112 is still at 63%, and the following CRASH report was seen on that host.&lt;br/&gt;
&lt;br/&gt;
[couchdb:error,2012-10-21T23:07:11.144,&lt;a href=&apos;mailto:ns_1@127.0.0.1&apos;&gt;ns_1@127.0.0.1&lt;/a&gt;:couch_view:couch_log:error:42]Exit on non-updater process: config_change&lt;br/&gt;
[couchdb:error,2012-10-21T23:07:11.144,&lt;a href=&apos;mailto:ns_1@127.0.0.1&apos;&gt;ns_1@127.0.0.1&lt;/a&gt;:couch_set_view:couch_log:error:42]Exit on non-updater process: config_change&lt;br/&gt;
[error_logger:error,2012-10-21T23:07:11.144,&lt;a href=&apos;mailto:ns_1@127.0.0.1&apos;&gt;ns_1@127.0.0.1&lt;/a&gt;:error_logger:ale_error_logger_handler:log_report:72]&lt;br/&gt;
=========================CRASH REPORT=========================&lt;br/&gt;
&amp;nbsp;&amp;nbsp;crasher:&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;initial call: couch_server:init/1&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;pid: &amp;lt;0.216.0&amp;gt;&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;registered_name: couch_server&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;exception exit: {function_clause,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;[{couch_server,&amp;#39;-terminate/2-fun-0-&amp;#39;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;[{&amp;lt;&amp;lt;&amp;quot;_replicator&amp;quot;&amp;gt;&amp;gt;,&amp;lt;0.444.0&amp;gt;}]},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{lists,foreach,2},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{gen_server,terminate,6},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{proc_lib,init_p_do_apply,3}]}&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;in function  gen_server:terminate/6&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;ancestors: [couch_primary_services,couch_server_sup,cb_couch_sup,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;ns_server_cluster_sup,&amp;lt;0.60.0&amp;gt;]&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;messages: []&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;links: [&amp;lt;0.230.0&amp;gt;,&amp;lt;0.444.0&amp;gt;,&amp;lt;0.211.0&amp;gt;]&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;dictionary: []&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;trap_exit: true&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;status: running&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;heap_size: 2584&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;stack_size: 24&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;reductions: 4530&lt;br/&gt;
&amp;nbsp;&amp;nbsp;neighbours:</comment>
                    <comment id="42323" author="mikew" created="Tue, 23 Oct 2012 16:22:45 -0500"  >Alk,&lt;br/&gt;
&lt;br/&gt;
Replication building is completed on 10.3.2.112 but ns_server has not killed the tap stream. Please take a look at this and let me know if there is anything else I can look at.&lt;br/&gt;
&lt;br/&gt;
Mike-Wiederholds-MacBook-Pro:ep-engine mikewied$ management/cbstats 10.3.2.112:11210 tap | egrep replication_building&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:ack_log_size:             0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:ack_seqno:                359937&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:ack_window_full:          false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:backfill_completed:       true&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:backfill_start_timestamp: 1350926553&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:bg_jobs_completed:        166602&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:bg_jobs_issued:           166602&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:bg_result_size:           0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:connected:                true&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:created:                  39985&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:flags:                    85 (ack,backfill,vblist,checkpoints)&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:has_queued_item:          false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:idle:                     true&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:paused:                   1&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:pending_backfill:         false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:pending_disconnect:       false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:pending_disk_backfill:    false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:qlen:                     0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:qlen_high_pri:            0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:qlen_low_pri:             0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:queue_backfillremaining:  0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:queue_backoff:            0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:queue_drain:              359877&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:queue_fill:               0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:queue_itemondisk:         0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:queue_memory:             0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:rec_fetched:              193330&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:recv_ack_seqno:           359936&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:reserved:                 1&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:seqno_ack_requested:      359936&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:supports_ack:             true&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:suspended:                false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:total_backlog_size:       0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:total_noops:              3963&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:type:                     producer&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:vb_filter:                { 494 }&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.2.108&apos;&gt;ns_1@10.3.2.108&lt;/a&gt;&amp;#39;:vb_filters:               1&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:ack_log_size:              0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:ack_seqno:                 97912&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:ack_window_full:           false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:backfill_completed:        true&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:backfill_start_timestamp:  0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:bg_jobs_completed:         0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:bg_jobs_issued:            0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:bg_result_size:            0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:connected:                 true&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:created:                   39985&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:flags:                     85 (ack,backfill,vblist,checkpoints)&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:has_queued_item:           false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:idle:                      true&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:paused:                    1&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:pending_backfill:          false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:pending_disconnect:        false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:pending_disk_backfill:     false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:qlen:                      0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:qlen_high_pri:             0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:qlen_low_pri:              0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:queue_backfillremaining:   0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:queue_backoff:             0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:queue_drain:               97854&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:queue_fill:                0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:queue_itemondisk:          0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:queue_memory:              0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:rec_fetched:               97909&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:recv_ack_seqno:            97911&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:reserved:                  1&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:seqno_ack_requested:       97911&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:supports_ack:              true&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:suspended:                 false&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:total_backlog_size:        0&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:total_noops:               3964&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:type:                      producer&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:vb_filter:                 { 494 }&lt;br/&gt;
&amp;nbsp;eq_tapq:replication_building_494_&amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;:vb_filters:                1</comment>
                    <comment id="42381" author="tommie" created="Wed, 24 Oct 2012 08:09:20 -0500"  >All logs here:&lt;br/&gt;
&lt;a href=&quot;https://docs.google.com/folder/d/0B48zH0LlqjKrNm9UYlhuNzZjSnM/edit&quot;&gt;https://docs.google.com/folder/d/0B48zH0LlqjKrNm9UYlhuNzZjSnM/edit&lt;/a&gt;&lt;br/&gt;
&lt;br/&gt;
This behavior was noticed during the 1.8.1 use case testing in 2.0 build 1870&lt;br/&gt;
&lt;a href=&quot;http://hub.internal.couchbase.com/confluence/display/QA/2.0+System+Test+Specs#2.0SystemTestSpecs-SystemTest%3A1.8.1usecase%28PlumWorkloadv1.0%29&quot;&gt;http://hub.internal.couchbase.com/confluence/display/QA/2.0+System+Test+Specs#2.0SystemTestSpecs-SystemTest%3A1.8.1usecase%28PlumWorkloadv1.0%29&lt;/a&gt;</comment>
                    <comment id="42402" author="alkondratenko" created="Wed, 24 Oct 2012 12:22:36 -0500"  >BTW, I don&amp;#39;t have a convenient way to download all logs from google drive.</comment>
                    <comment id="42407" author="alkondratenko" created="Wed, 24 Oct 2012 12:57:27 -0500"  >We&amp;#39;re stuck waiting for checkpoint 67 to be persisted on vbucket 494 on node .65.&lt;br/&gt;
&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{&amp;lt;17848.6247.34&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;[{registered_name,[]},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{status,waiting},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{initial_call,{proc_lib,init_p,3}},&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;{backtrace,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;[&amp;lt;&amp;lt;&amp;quot;Program counter: 0x00007f5e10ee9e48 (gen:do_call/4 + 576)&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;CP: 0x0000000000000000 (invalid)&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;arity = 0&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;0x00007f5e0b871858 Return addr 0x00007f5e10f68870 (gen_server:call/3 + 128)&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;y(0)     #Ref&amp;lt;0.0.50.98207&amp;gt;&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;y(1)     &amp;#39;&lt;a href=&apos;mailto:ns_1@10.3.3.65&apos;&gt;ns_1@10.3.3.65&lt;/a&gt;&amp;#39;&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;y(2)     []&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;y(3)     infinity&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;y(4)     {wait_for_checkpoint_persistence,494,67}&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;y(5)     &amp;#39;$gen_call&amp;#39;&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;y(6)     &amp;lt;0.2607.0&amp;gt;&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;x00007f5e0b871898 Return addr 0x00007f5e06f9e228 (janitor_agent:do_wait_checkpoint_persist&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;y(0)     infinity&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;y(1)     {wait_for_checkpoint_persistence,494,67}&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;y(2)     &amp;#39;ns_memcached-default&amp;#39;&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;quot;y(3)     Catch 0x00007f5e10f68870 (gen_server:call/3 + 128)&amp;quot;&amp;gt;&amp;gt;,&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;lt;&amp;lt;&amp;gt;&amp;gt;,&lt;br/&gt;
&lt;br/&gt;
(that&amp;#39;s the janitor_agent child on .65 doing that call)&lt;br/&gt;
&lt;br/&gt;
And stats indicate that it&amp;#39;s actually persisted:&lt;br/&gt;
&lt;br/&gt;
&amp;nbsp;{&amp;lt;&amp;lt;&amp;quot;vb_494:persisted_checkpoint_id&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;92&amp;quot;&amp;gt;&amp;gt;},&lt;br/&gt;
&amp;nbsp;{&amp;lt;&amp;lt;&amp;quot;vb_494:checkpoint_extension&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;false&amp;quot;&amp;gt;&amp;gt;},&lt;br/&gt;
&amp;nbsp;{&amp;lt;&amp;lt;&amp;quot;vb_494:num_items_for_persistence&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;0&amp;quot;&amp;gt;&amp;gt;},&lt;br/&gt;
&amp;nbsp;{&amp;lt;&amp;lt;&amp;quot;vb_494:num_checkpoints&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;1&amp;quot;&amp;gt;&amp;gt;},&lt;br/&gt;
&amp;nbsp;{&amp;lt;&amp;lt;&amp;quot;vb_494:num_open_checkpoint_items&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;0&amp;quot;&amp;gt;&amp;gt;},&lt;br/&gt;
&amp;nbsp;{&amp;lt;&amp;lt;&amp;quot;vb_494:num_checkpoint_items&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;1&amp;quot;&amp;gt;&amp;gt;},&lt;br/&gt;
&amp;nbsp;{&amp;lt;&amp;lt;&amp;quot;vb_494:num_tap_cursors&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;0&amp;quot;&amp;gt;&amp;gt;},&lt;br/&gt;
&amp;nbsp;{&amp;lt;&amp;lt;&amp;quot;vb_494:last_closed_checkpoint_id&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;92&amp;quot;&amp;gt;&amp;gt;},&lt;br/&gt;
&amp;nbsp;{&amp;lt;&amp;lt;&amp;quot;vb_494:open_checkpoint_id&amp;quot;&amp;gt;&amp;gt;,&amp;lt;&amp;lt;&amp;quot;93&amp;quot;&amp;gt;&amp;gt;},&lt;br/&gt;
</comment>
                    <comment id="42412" author="mikew" created="Wed, 24 Oct 2012 13:33:39 -0500"  >Chiyoung,&lt;br/&gt;
&lt;br/&gt;
This is an issue with the new checkpoint persistence command you added. I think we should add a stat for checkpoint persistence commands in progress. For example, a stat that is incremented when we receive a checkpoint persistence request and decremented when the request completes.</comment>
                    <comment id="42426" author="chiyoung" created="Wed, 24 Oct 2012 15:37:30 -0500"  >I dumped connections stats from memcached layer in 10.3.3.65 and found one connection that is still in ewouldblock state and corresponds to vb_checkpoint_persistence command&lt;br/&gt;
&lt;br/&gt;
STAT conn 0x58cf080&lt;br/&gt;
STAT socket 83&lt;br/&gt;
STAT protocol binary&lt;br/&gt;
STAT transport TCP&lt;br/&gt;
STAT nevents 20&lt;br/&gt;
STAT sasl_conn 0xcbaf5390&lt;br/&gt;
STAT state conn_nread&lt;br/&gt;
STAT substate bin_reading_packet&lt;br/&gt;
STAT registered_in_libevent 0&lt;br/&gt;
STAT ev_flags 12&lt;br/&gt;
STAT which 2&lt;br/&gt;
STAT rbuf 0x58d0000&lt;br/&gt;
STAT rcurr 0x58d0020&lt;br/&gt;
STAT rsize 2048&lt;br/&gt;
STAT rbytes 0&lt;br/&gt;
STAT wbuf 0x58e7800&lt;br/&gt;
STAT wcurr 0x58fb000&lt;br/&gt;
STAT wsize 2048&lt;br/&gt;
STAT wbytes 24&lt;br/&gt;
STAT write_and_go 0x4104f0&lt;br/&gt;
STAT write_and_free (nil)&lt;br/&gt;
STAT ritem 0x58d0020&lt;br/&gt;
STAT rlbytes 0&lt;br/&gt;
STAT item (nil)&lt;br/&gt;
STAT store_op 0&lt;br/&gt;
STAT sbytes 0&lt;br/&gt;
STAT iov 0x58e0800&lt;br/&gt;
STAT iovsize 400&lt;br/&gt;
STAT iovused 0&lt;br/&gt;
STAT msglist 0x58d5440&lt;br/&gt;
STAT msgsize 10&lt;br/&gt;
STAT msgused 1&lt;br/&gt;
STAT msgcurr 0&lt;br/&gt;
STAT msgbytes 0&lt;br/&gt;
STAT ilist 0x58d9100&lt;br/&gt;
STAT isize 200&lt;br/&gt;
STAT icurr 0x58d9100&lt;br/&gt;
STAT ileft 0&lt;br/&gt;
STAT suffixlist 0x58539a0&lt;br/&gt;
STAT suffixsize 20&lt;br/&gt;
STAT suffixcurr 0x58539a0&lt;br/&gt;
STAT suffixleft 0&lt;br/&gt;
STAT noreply 0&lt;br/&gt;
STAT refcount 1&lt;br/&gt;
STAT dynamic_buffer.buffer (nil)&lt;br/&gt;
STAT dynamic_buffer.size 2048&lt;br/&gt;
STAT dynamic_buffer.offset 24&lt;br/&gt;
STAT engine_storage 0xcd6fb0a0&lt;br/&gt;
STAT cas 0&lt;br/&gt;
STAT cmd 177&lt;br/&gt;
STAT opaque 0&lt;br/&gt;
STAT keylen 0&lt;br/&gt;
STAT list_state 0&lt;br/&gt;
STAT next (nil)&lt;br/&gt;
STAT thread 0x10c55f0&lt;br/&gt;
STAT aiostat 0&lt;br/&gt;
STAT ewouldblock 1&lt;br/&gt;
STAT tap_iterator (nil)&lt;br/&gt;
&lt;br/&gt;
I&amp;#39;m further debugging it now.&lt;br/&gt;
</comment>
                    <comment id="42456" author="chiyoung" created="Wed, 24 Oct 2012 18:49:59 -0500"  >Tommie,&lt;br/&gt;
&lt;br/&gt;
As we saw, rebalancing out 10.3.3.65 was successful. While debugging this issue, I ran into some problems on .65 while doing GETs for non-resident items, which put my connection into the ewouldblock state in the memcached layer. I will continue to debug this issue.&lt;br/&gt;
&lt;br/&gt;
Please update the bug if you see the same rebalance hang again.</comment>
                    <comment id="42577" author="thuan" created="Fri, 26 Oct 2012 04:52:02 -0500"  >Integrated in github-ep-engine-2-0 #451 (See [&lt;a href=&quot;http://qa.hq.northscale.net/job/github-ep-engine-2-0/451/&quot;&gt;http://qa.hq.northscale.net/job/github-ep-engine-2-0/451/&lt;/a&gt;])&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&lt;a href=&quot;http://www.couchbase.com/issues/browse/MB-6992&quot; title=&quot;rebalance hangs after failing over disconnected node&quot;&gt;&lt;strike&gt;MB-6992&lt;/strike&gt;&lt;/a&gt; Add more informative logs to checkpoint prioritization (Revision 3c719d47ca41285bbcbc61817f719180448f1042)&lt;br/&gt;
&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;Result = SUCCESS&lt;br/&gt;
Chiyoung Seo : &lt;br/&gt;
Files : &lt;br/&gt;
* src/ep.cc&lt;br/&gt;
</comment>
                    <comment id="42668" author="chiyoung" created="Fri, 26 Oct 2012 19:18:34 -0500"  >&lt;a href=&quot;http://review.couchbase.org/#/c/22022/&quot;&gt;http://review.couchbase.org/#/c/22022/&lt;/a&gt;</comment>
                    <comment id="42676" author="thuan" created="Fri, 26 Oct 2012 20:37:35 -0500"  >Integrated in github-ep-engine-2-0 #452 (See [&lt;a href=&quot;http://qa.hq.northscale.net/job/github-ep-engine-2-0/452/&quot;&gt;http://qa.hq.northscale.net/job/github-ep-engine-2-0/452/&lt;/a&gt;])&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&lt;a href=&quot;http://www.couchbase.com/issues/browse/MB-6992&quot; title=&quot;rebalance hangs after failing over disconnected node&quot;&gt;&lt;strike&gt;MB-6992&lt;/strike&gt;&lt;/a&gt; Control the flusher execution by the transaction size (Revision b327be09a1f971145fda5c249b4fa7a8304b1920)&lt;br/&gt;
&lt;br/&gt;
&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;Result = SUCCESS&lt;br/&gt;
Chiyoung Seo : &lt;br/&gt;
Files : &lt;br/&gt;
* tests/ep_testsuite.cc&lt;br/&gt;
* src/ep.cc&lt;br/&gt;
* src/ep.hh&lt;br/&gt;
* src/flusher.hh&lt;br/&gt;
* src/flusher.cc&lt;br/&gt;
</comment>
                </comments>
                    <attachments>
                    <attachment id="15528" name="10.3.3.59.debug.tar.gz" size="4074514" author="tommie" created="Tue, 23 Oct 2012 15:39:58 -0500" />
                    <attachment id="15529" name="10.3.3.60.debug.tar.gz" size="849706" author="tommie" created="Tue, 23 Oct 2012 15:39:58 -0500" />
                </attachments>
            <subtasks>
        </subtasks>
                <customfields>
                                                                        <customfield id="customfield_10180" key="com.atlassian.jira.ext.charting:firstresponsedate">
                <customfieldname>Date of First Response</customfieldname>
                <customfieldvalues>
                    <customfieldvalue>Tue, 23 Oct 2012 16:22:45 -0500</customfieldvalue>

                </customfieldvalues>
            </customfield>
                                                                                                                                                                                                            <customfield id="customfield_10081" key="com.pyxis.greenhopper.jira:gh-global-rank">
                <customfieldname>Rank</customfieldname>
                <customfieldvalues>
                    <customfieldvalue>3685</customfieldvalue>
                </customfieldvalues>
            </customfield>
                                                                                                                                                                                        <customfield id="customfield_10181" key="com.atlassian.jira.ext.charting:timeinstatus">
                <customfieldname>Time In Status</customfieldname>
                <customfieldvalues>
                    
                </customfieldvalues>
            </customfield>
                                                </customfields>
    </item>
</channel>
</rss>