<!-- 
RSS generated by JIRA (8.20.10#820010-sha1:ace47f9899e9ee25d7157d59aa17ab06aee30d3d) at Wed Feb 07 19:56:15 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>OpenDaylight JIRA</title>
    <link>https://jira.opendaylight.org</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>8.20.10</version>
        <build-number>820010</build-number>
        <build-date>22-06-2022</build-date>
    </build-info>


<item>
            <title>[CONTROLLER-1713] RequestTimeoutException after remove-shard-replica with &quot;transferred leadership to null&quot;</title>
                <link>https://jira.opendaylight.org/browse/CONTROLLER-1713</link>
                <project id="10113" key="CONTROLLER">controller</project>
                    <description>&lt;p&gt;Seen &lt;span class=&quot;error&quot;&gt;&amp;#91;0&amp;#93;&lt;/span&gt; on RelEng first time with module-based shard (tell-based protocol).&lt;br/&gt;
Member-3 was the old leader, member-2 became new leader.&lt;/p&gt;

&lt;p&gt;This is similar to &lt;a href=&quot;https://jira.opendaylight.org/browse/CONTROLLER-1693&quot; title=&quot;UnreachableMember during remove-shard-replica prevents new leader to get elected&quot; class=&quot;issue-link&quot; data-issue-key=&quot;CONTROLLER-1693&quot;&gt;&lt;del&gt;CONTROLLER-1693&lt;/del&gt;&lt;/a&gt; in that member-2 has seen UnreachableMember after remove-shard-replica.&lt;br/&gt;
This is also similar to &lt;a href=&quot;https://jira.opendaylight.org/browse/CONTROLLER-1705&quot; title=&quot;Client on a follower prefix-based shard sometimes does not reconnect when the previous leader is isolated&quot; class=&quot;issue-link&quot; data-issue-key=&quot;CONTROLLER-1705&quot;&gt;&lt;del&gt;CONTROLLER-1705&lt;/del&gt;&lt;/a&gt; in that the client (at member-3) has not properly reconnected to the new leader.&lt;/p&gt;

&lt;p&gt;The quoted part of the title is seen in member-3 karaf.log &lt;span class=&quot;error&quot;&gt;&amp;#91;1&amp;#93;&lt;/span&gt;:&lt;br/&gt;
2017-06-08 07:26:38,108 | INFO  | lt-dispatcher-29 | aftActorLeadershipTransferCohort | 193 - org.opendaylight.controller.sal-akka-raft - 1.5.1.Carbon | member-3-shard-default-config: Successfully transferred leadership to null in 3.074 s&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;0&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-only-carbon/736/log.html.gz#s1-s20-t1-k2-k9&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-only-carbon/736/log.html.gz#s1-s20-t1-k2-k9&lt;/a&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;1&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-only-carbon/736/odl3_karaf.log.gz&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-only-carbon/736/odl3_karaf.log.gz&lt;/a&gt;&lt;/p&gt;</description>
                <environment>&lt;p&gt;Operating System: All&lt;br/&gt;
Platform: All&lt;/p&gt;</environment>
        <key id="26267">CONTROLLER-1713</key>
            <summary>RequestTimeoutException after remove-shard-replica with &quot;transferred leadership to null&quot;</summary>
                <type id="10104" iconUrl="https://jira.opendaylight.org/secure/viewavatar?size=xsmall&amp;avatarId=10303&amp;avatarType=issuetype">Bug</type>
                                                <status id="10004" iconUrl="https://jira.opendaylight.org/images/icons/status_generic.gif" description="">Verified</status>
                    <statusCategory id="3" key="done" colorName="green"/>
                                    <resolution id="10000">Done</resolution>
                                        <assignee username="rovarga">Robert Varga</assignee>
                                    <reporter username="vrpolak">Vratko Polak</reporter>
                        <labels>
                    </labels>
                <created>Thu, 8 Jun 2017 15:38:45 +0000</created>
                <updated>Tue, 25 Jul 2023 08:24:42 +0000</updated>
                            <resolved>Wed, 13 Sep 2017 08:30:41 +0000</resolved>
                                                                    <component>clustering</component>
                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                                                                <comments>
                            <comment id="52401" author="vrpolak" created="Mon, 12 Jun 2017 12:29:40 +0000"  >&lt;p&gt;Something similar happened &lt;span class=&quot;error&quot;&gt;&amp;#91;2&amp;#93;&lt;/span&gt; again. Karaf.log &lt;span class=&quot;error&quot;&gt;&amp;#91;3&amp;#93;&lt;/span&gt; contains the quoted part, but there are other suspicious lines, so I am not really sure this is the same Bug.&lt;/p&gt;

&lt;p&gt;2017-06-11 11:53:06,783 | INFO  | rd-dispatcher-38 | aftActorLeadershipTransferCohort | 193 - org.opendaylight.controller.sal-akka-raft - 1.5.1.Carbon | member-1-shard-default-config: Successfully transferred leadership to null in 2.319 s&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;2&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-only-carbon/739/log.html.gz#s1-s36-t3-k2-k14&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-only-carbon/739/log.html.gz#s1-s36-t3-k2-k14&lt;/a&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;3&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-only-carbon/739/odl1_karaf.log.gz&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-only-carbon/739/odl1_karaf.log.gz&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="52402" author="vrpolak" created="Thu, 7 Sep 2017 11:15:55 +0000"  >&lt;p&gt;Examining the history of the -all- job, I have found a more recent (2017-08-24) occurrence &lt;span class=&quot;error&quot;&gt;&amp;#91;4&amp;#93;&lt;/span&gt;.&lt;/p&gt;

&lt;p&gt;After comparing karaf logs, I think this has to do with frontend reconnect happening while there is a member in PreLeader state.&lt;/p&gt;

&lt;p&gt;First, let me copy INFO logs (copied from &lt;span class=&quot;error&quot;&gt;&amp;#91;5&amp;#93;&lt;/span&gt;) from a run where the test passed. The log belongs to member-1 (the old leader), the new leader is member-2. It is not clear from INFO level which member-1 component has first become aware that member-2 is a leader to allow successful reconnect (09:14:33,018), as member-1 Shard switched from Leader to Follower only after seeing (09:14:34,006) higher term from the other follower (member-3) AppendEntriesReply. This probably implies there was a time interval when both member-2 and member-1 claimed to be a Leader.&lt;/p&gt;

&lt;p&gt;2017-09-05 09:14:32,878 | INFO  | qtp481975108-122 | ClusterAdminRpcService           | 182 - org.opendaylight.controller.sal-cluster-admin-impl - 1.5.2.Carbon | Removing replica for shard default memberName member-1, datastoreType Config&lt;br/&gt;
2017-09-05 09:14:32,896 | INFO  | ult-dispatcher-2 | ClusterAdminRpcService           | 182 - org.opendaylight.controller.sal-cluster-admin-impl - 1.5.2.Carbon | Successfully removed replica for shard default&lt;br/&gt;
2017-09-05 09:14:32,906 | INFO  | rd-dispatcher-40 | tActorServerConfigurationSupport | 174 - org.opendaylight.controller.sal-akka-raft - 1.5.2.Carbon | member-1-shard-default-config: ServerConfigurationPayload [serverConfig=[ServerInfo &lt;span class=&quot;error&quot;&gt;&amp;#91;id=member-3-shard-default-config, isVoting=true&amp;#93;&lt;/span&gt;, ServerInfo &lt;span class=&quot;error&quot;&gt;&amp;#91;id=member-2-shard-default-config, isVoting=true&amp;#93;&lt;/span&gt;]] has been successfully replicated to a majority of followers&lt;br/&gt;
2017-09-05 09:14:32,917 | INFO  | rd-dispatcher-39 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received LeaderStateChanged message: LeaderStateChanged &lt;span class=&quot;error&quot;&gt;&amp;#91;memberId=member-1-shard-default-config, leaderId=null, leaderPayloadVersion=5&amp;#93;&lt;/span&gt;&lt;br/&gt;
2017-09-05 09:14:32,943 | INFO  | lt-dispatcher-21 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: connection ConnectedClientConnection{client=ClientIdentifier&lt;/p&gt;
{frontend=member-1-frontend-datastore-config, generation=0}, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;a href=&quot;#-543839374&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#-543839374&lt;/a&gt;, sessionId=0, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=present}} indicated no leadership, reconnecting it&lt;br/&gt;
org.opendaylight.controller.cluster.access.commands.NotLeaderException: Actor Actor&lt;a href=&quot;#-543839374&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#-543839374&lt;/a&gt; is not the current leader&lt;br/&gt;
2017-09-05 09:14:32,960 | INFO  | lt-dispatcher-21 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: connection ConnectedClientConnection{client=ClientIdentifier{frontend=member-1-frontend-datastore-config, generation=0}
&lt;p&gt;, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;a href=&quot;#-543839374&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#-543839374&lt;/a&gt;, sessionId=0, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=present}} reconnecting as ReconnectingClientConnection{client=ClientIdentifier&lt;/p&gt;
{frontend=member-1-frontend-datastore-config, generation=0}, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;a href=&quot;#-543839374&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#-543839374&lt;/a&gt;, sessionId=0, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=present}}&lt;br/&gt;
2017-09-05 09:14:32,960 | INFO  | lt-dispatcher-21 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: refreshing backend for shard 0&lt;br/&gt;
2017-09-05 09:14:32,996 | INFO  | lt-dispatcher-41 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: resolved shard 0 to ShardBackendInfo{actor=Actor[akka.tcp://opendaylight-cluster-data@10.29.15.180:2550/user/shardmanager-config/member-2-shard-default-config#-754756015], sessionId=2, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=absent}&lt;br/&gt;
2017-09-05 09:14:32,996 | INFO  | lt-dispatcher-41 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: resolving connection ReconnectingClientConnection{client=ClientIdentifier{frontend=member-1-frontend-datastore-config, generation=0}
&lt;p&gt;, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;a href=&quot;#-543839374&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#-543839374&lt;/a&gt;, sessionId=0, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=present}} to ConnectedClientConnection{client=ClientIdentifier&lt;/p&gt;
{frontend=member-1-frontend-datastore-config, generation=0}, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;span class=&quot;error&quot;&gt;&amp;#91;akka.tcp://opendaylight-cluster-data@10.29.15.180:2550/user/shardmanager-config/member-2-shard-default-config#-754756015&amp;#93;&lt;/span&gt;, sessionId=2, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=absent}}&lt;br/&gt;
2017-09-05 09:14:33,018 | INFO  | lt-dispatcher-41 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: replaced connection ReconnectingClientConnection{client=ClientIdentifier{frontend=member-1-frontend-datastore-config, generation=0}
&lt;p&gt;, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;a href=&quot;#-543839374&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#-543839374&lt;/a&gt;, sessionId=0, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=present}} with ConnectedClientConnection{client=ClientIdentifier&lt;/p&gt;
{frontend=member-1-frontend-datastore-config, generation=0}, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;span class=&quot;error&quot;&gt;&amp;#91;akka.tcp://opendaylight-cluster-data@10.29.15.180:2550/user/shardmanager-config/member-2-shard-default-config#-754756015&amp;#93;&lt;/span&gt;, sessionId=2, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=absent}} in 21.22 ms&lt;br/&gt;
2017-09-05 09:14:34,006 | INFO  | rd-dispatcher-39 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | member-1-shard-default-config (Leader): Term 2 in &quot;AppendEntriesReply &lt;span class=&quot;error&quot;&gt;&amp;#91;term=2, success=false, followerId=member-3-shard-default-config, logLastIndex=12193, logLastTerm=2, forceInstallSnapshot=false, payloadVersion=5, raftVersion=3&amp;#93;&lt;/span&gt;&quot; message is greater than leader&apos;s term 1 - switching to Follower&lt;br/&gt;
2017-09-05 09:14:34,007 | INFO  | rd-dispatcher-39 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | member-1-shard-default-config (Leader) :- Switching from behavior Leader to Follower, election term: 2&lt;br/&gt;
2017-09-05 09:14:34,008 | INFO  | lt-dispatcher-22 | RoleChangeNotifier               | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | RoleChangeNotifier for member-1-shard-default-config , received role change from Leader to Follower&lt;br/&gt;
2017-09-05 09:14:34,008 | INFO  | rd-dispatcher-54 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received LeaderStateChanged message: LeaderStateChanged &lt;span class=&quot;error&quot;&gt;&amp;#91;memberId=member-1-shard-default-config, leaderId=null, leaderPayloadVersion=-1&amp;#93;&lt;/span&gt;&lt;br/&gt;
2017-09-05 09:14:34,008 | INFO  | rd-dispatcher-54 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received role changed for member-1-shard-default-config from Leader to Follower&lt;br/&gt;
2017-09-05 09:14:34,969 | INFO  | rd-dispatcher-37 | aftActorLeadershipTransferCohort | 174 - org.opendaylight.controller.sal-akka-raft - 1.5.2.Carbon | member-1-shard-default-config: Successfully transferred leadership to null in 2.052 s&lt;br/&gt;
&lt;br/&gt;
&lt;br/&gt;
Now, when this Bug happens, the old leader (member-1) INFO messages (copied from karaf log &lt;span class=&quot;error&quot;&gt;&amp;#91;6&amp;#93;&lt;/span&gt;) are nearly the same, except that the unknown component never learns who the new leader (member-3) is; the frontend keeps trying to connect to member-1 and never succeeds.&lt;br/&gt;
&lt;br/&gt;
2017-08-24 15:24:13,620 | INFO  | qtp412422320-101 | ClusterAdminRpcService           | 182 - org.opendaylight.controller.sal-cluster-admin-impl - 1.5.2.Carbon | Removing replica for shard default memberName member-1, datastoreType Config&lt;br/&gt;
2017-08-24 15:24:13,654 | INFO  | lt-dispatcher-26 | ClusterAdminRpcService           | 182 - org.opendaylight.controller.sal-cluster-admin-impl - 1.5.2.Carbon | Successfully removed replica for shard default&lt;br/&gt;
2017-08-24 15:24:13,670 | INFO  | rd-dispatcher-53 | tActorServerConfigurationSupport | 174 - org.opendaylight.controller.sal-akka-raft - 1.5.2.Carbon | member-1-shard-default-config: ServerConfigurationPayload [serverConfig=[ServerInfo &lt;span class=&quot;error&quot;&gt;&amp;#91;id=member-3-shard-default-config, isVoting=true&amp;#93;&lt;/span&gt;, ServerInfo &lt;span class=&quot;error&quot;&gt;&amp;#91;id=member-2-shard-default-config, isVoting=true&amp;#93;&lt;/span&gt;]] has been successfully replicated to a majority of followers&lt;br/&gt;
2017-08-24 15:24:13,681 | INFO  | rd-dispatcher-37 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received LeaderStateChanged message: LeaderStateChanged &lt;span class=&quot;error&quot;&gt;&amp;#91;memberId=member-1-shard-default-config, leaderId=null, leaderPayloadVersion=5&amp;#93;&lt;/span&gt;&lt;br/&gt;
2017-08-24 15:24:13,684 | INFO  | lt-dispatcher-25 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: connection ConnectedClientConnection{client=ClientIdentifier{frontend=member-1-frontend-datastore-config, generation=0}
&lt;p&gt;, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;a href=&quot;#513397858&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#513397858&lt;/a&gt;, sessionId=0, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=present}} indicated no leadership, reconnecting it&lt;br/&gt;
org.opendaylight.controller.cluster.access.commands.NotLeaderException: Actor Actor&lt;a href=&quot;#513397858&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#513397858&lt;/a&gt; is not the current leader&lt;br/&gt;
2017-08-24 15:24:13,691 | INFO  | lt-dispatcher-25 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: connection ConnectedClientConnection{client=ClientIdentifier&lt;/p&gt;
{frontend=member-1-frontend-datastore-config, generation=0}, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;a href=&quot;#513397858&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#513397858&lt;/a&gt;, sessionId=0, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=present}} reconnecting as ReconnectingClientConnection{client=ClientIdentifier{frontend=member-1-frontend-datastore-config, generation=0}
&lt;p&gt;, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;a href=&quot;#513397858&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#513397858&lt;/a&gt;, sessionId=0, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=present}}&lt;br/&gt;
2017-08-24 15:24:13,691 | INFO  | lt-dispatcher-25 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: refreshing backend for shard 0&lt;br/&gt;
2017-08-24 15:24:13,744 | INFO  | rd-dispatcher-53 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | member-1-shard-default-config: not currently leader, rejecting request ConnectClientRequest{target=ClientIdentifier&lt;/p&gt;
{frontend=member-1-frontend-datastore-config, generation=0}
&lt;p&gt;, sequence=0, replyTo=Actor&lt;span class=&quot;error&quot;&gt;&amp;#91;akka://opendaylight-cluster-data/temp/$q&amp;#93;&lt;/span&gt;, minVersion=BORON, maxVersion=BORON}. isLeader: true, isLeaderActive: false,isLeadershipTransferInProgress: true.&lt;br/&gt;
2017-08-24 15:24:13,748 | WARN  | monPool-worker-3 | AbstractShardBackendResolver     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | Failed to resolve shard&lt;br/&gt;
java.util.concurrent.TimeoutException: Connection attempt failed&lt;/p&gt;


&lt;p&gt;Here is karaf log &lt;span class=&quot;error&quot;&gt;&amp;#91;7&amp;#93;&lt;/span&gt; segment from the new leader (member-3) showing transient PreLeader state.&lt;/p&gt;

&lt;p&gt;2017-08-24 15:24:13,680 | INFO  | rd-dispatcher-31 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received LeaderStateChanged message: LeaderStateChanged &lt;span class=&quot;error&quot;&gt;&amp;#91;memberId=member-3-shard-default-config, leaderId=null, leaderPayloadVersion=5&amp;#93;&lt;/span&gt;&lt;br/&gt;
2017-08-24 15:24:13,700 | INFO  | rd-dispatcher-29 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | member-3-shard-default-config (Candidate): Starting new election term 2&lt;br/&gt;
2017-08-24 15:24:13,700 | INFO  | rd-dispatcher-29 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | member-3-shard-default-config (Follower) :- Switching from behavior Follower to Candidate, election term: 2&lt;br/&gt;
2017-08-24 15:24:13,701 | INFO  | lt-dispatcher-21 | RoleChangeNotifier               | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | RoleChangeNotifier for member-3-shard-default-config , received role change from Follower to Candidate&lt;br/&gt;
2017-08-24 15:24:13,701 | INFO  | rd-dispatcher-33 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received LeaderStateChanged message: LeaderStateChanged &lt;span class=&quot;error&quot;&gt;&amp;#91;memberId=member-3-shard-default-config, leaderId=null, leaderPayloadVersion=-1&amp;#93;&lt;/span&gt;&lt;br/&gt;
2017-08-24 15:24:13,701 | INFO  | rd-dispatcher-33 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received role changed for member-3-shard-default-config from Follower to Candidate&lt;br/&gt;
2017-08-24 15:24:13,789 | INFO  | rd-dispatcher-29 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | member-3-shard-default-config (Candidate): LastApplied index 10366 is behind last index 10376 - switching to PreLeader&lt;br/&gt;
2017-08-24 15:24:13,795 | INFO  | rd-dispatcher-29 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | member-3-shard-default-config (Candidate) :- Switching from behavior Candidate to PreLeader, election term: 2&lt;br/&gt;
2017-08-24 15:24:13,813 | INFO  | rd-dispatcher-32 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received LeaderStateChanged message: LeaderStateChanged &lt;span class=&quot;error&quot;&gt;&amp;#91;memberId=member-3-shard-default-config, leaderId=member-3-shard-default-config, leaderPayloadVersion=5&amp;#93;&lt;/span&gt;&lt;br/&gt;
2017-08-24 15:24:13,816 | INFO  | lt-dispatcher-20 | RoleChangeNotifier               | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | RoleChangeNotifier for member-3-shard-default-config , received role change from Candidate to PreLeader&lt;br/&gt;
2017-08-24 15:24:13,817 | INFO  | rd-dispatcher-32 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received role changed for member-3-shard-default-config from Candidate to PreLeader&lt;br/&gt;
2017-08-24 15:24:13,838 | INFO  | rd-dispatcher-31 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | member-3-shard-default-config (PreLeader) :- Switching from behavior PreLeader to Leader, election term: 2&lt;br/&gt;
2017-08-24 15:24:13,839 | INFO  | lt-dispatcher-43 | RoleChangeNotifier               | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | RoleChangeNotifier for member-3-shard-default-config , received role change from PreLeader to Leader&lt;br/&gt;
2017-08-24 15:24:13,839 | INFO  | rd-dispatcher-32 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received role changed for member-3-shard-default-config from PreLeader to Leader&lt;br/&gt;
2017-08-24 15:24:13,840 | INFO  | rd-dispatcher-32 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: All Shards are ready - data store config is ready, available count is 0&lt;br/&gt;
2017-08-24 15:24:14,714 | INFO  | rd-dispatcher-32 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | member-3-shard-default-config (Leader): Cannot append entries because sender&apos;s term 1 is less than 2&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;4&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-all-carbon/418/log.html.gz#s1-s20-t1-k2-k10-k2-k1&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-all-carbon/418/log.html.gz#s1-s20-t1-k2-k10-k2-k1&lt;/a&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;5&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-all-carbon/432/odl1_karaf.log.gz&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-all-carbon/432/odl1_karaf.log.gz&lt;/a&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;6&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-all-carbon/418/odl1_karaf.log.gz&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-all-carbon/418/odl1_karaf.log.gz&lt;/a&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;7&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-all-carbon/418/odl3_karaf.log.gz&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://logs.opendaylight.org/releng/jenkins092/controller-csit-3node-clustering-all-carbon/418/odl3_karaf.log.gz&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="52403" author="rovarga" created="Mon, 11 Sep 2017 13:43:07 +0000"  >&lt;p&gt;This looks like we are failing to invalidate the cache after we have shut down the local member.&lt;/p&gt;

&lt;p&gt;Relevant logs:&lt;/p&gt;

&lt;p&gt;2017-08-24 15:24:08,268 | INFO  | h for user karaf | command                          | 498 - org.apache.karaf.log.command - 3.0.8 | ROBOT MESSAGE: Starting test Local_Leader_Shutdown&lt;br/&gt;
2017-08-24 15:24:13,620 | INFO  | qtp412422320-101 | ClusterAdminRpcService           | 182 - org.opendaylight.controller.sal-cluster-admin-impl - 1.5.2.Carbon | Removing replica for shard default memberName member-1, datastoreType Config&lt;br/&gt;
2017-08-24 15:24:13,654 | INFO  | lt-dispatcher-26 | ClusterAdminRpcService           | 182 - org.opendaylight.controller.sal-cluster-admin-impl - 1.5.2.Carbon | Successfully removed replica for shard default&lt;br/&gt;
2017-08-24 15:24:13,670 | INFO  | rd-dispatcher-53 | tActorServerConfigurationSupport | 174 - org.opendaylight.controller.sal-akka-raft - 1.5.2.Carbon | member-1-shard-default-config: ServerConfigurationPayload [serverConfig=[ServerInfo &lt;span class=&quot;error&quot;&gt;&amp;#91;id=member-3-shard-default-config, isVoting=true&amp;#93;&lt;/span&gt;, ServerInfo &lt;span class=&quot;error&quot;&gt;&amp;#91;id=member-2-shard-default-config, isVoting=true&amp;#93;&lt;/span&gt;]] has been successfully replicated to a majority of followers&lt;br/&gt;
2017-08-24 15:24:13,681 | INFO  | rd-dispatcher-37 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received LeaderStateChanged message: LeaderStateChanged &lt;span class=&quot;error&quot;&gt;&amp;#91;memberId=member-1-shard-default-config, leaderId=null, leaderPayloadVersion=5&amp;#93;&lt;/span&gt;&lt;br/&gt;
2017-08-24 15:24:13,684 | INFO  | lt-dispatcher-25 | ClientActorBehavior              | 178 - org.opendaylight.controller.cds-access-client - 1.1.2.Carbon | member-1-frontend-datastore-config: connection ConnectedClientConnection{client=ClientIdentifier&lt;/p&gt;
{frontend=member-1-frontend-datastore-config, generation=0}
&lt;p&gt;, cookie=0, backend=ShardBackendInfo{actor=Actor&lt;a href=&quot;#513397858&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;akka://opendaylight-cluster-data/user/shardmanager-config/member-1-shard-default-config#513397858&lt;/a&gt;, sessionId=0, version=BORON, maxMessages=1000, cookie=0, shard=default, dataTree=present}} indicated no leadership, reconnecting it&lt;/p&gt;

&lt;p&gt;2017-08-24 15:24:14,715 | INFO  | rd-dispatcher-35 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received LeaderStateChanged message: LeaderStateChanged [memberId=member-1-shard-default-config, leaderId=null, leaderPayloadVersion=-1]&lt;br/&gt;
2017-08-24 15:24:14,715 | INFO  | rd-dispatcher-35 | ShardManager                     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | shard-manager-config: Received role changed for member-1-shard-default-config from Leader to Follower&lt;/p&gt;

&lt;p&gt;2017-08-24 15:24:15,708 | INFO  | rd-dispatcher-36 | aftActorLeadershipTransferCohort | 174 - org.opendaylight.controller.sal-akka-raft - 1.5.2.Carbon | member-1-shard-default-config: Successfully transferred leadership to null in 2.034 s&lt;br/&gt;
2017-08-24 15:24:15,719 | INFO  | rd-dispatcher-34 | Shard                            | 173 - org.opendaylight.controller.sal-clustering-commons - 1.5.2.Carbon | Stopping Shard member-1-shard-default-config&lt;/p&gt;


&lt;p&gt;After which we are continuing to get:&lt;/p&gt;


&lt;p&gt;2017-08-24 15:24:20,799 | WARN  | monPool-worker-3 | AbstractShardBackendResolver     | 180 - org.opendaylight.controller.sal-distributed-datastore - 1.5.2.Carbon | Failed to resolve shard&lt;br/&gt;
java.util.concurrent.TimeoutException: Connection attempt failed&lt;br/&gt;
        at org.opendaylight.controller.cluster.databroker.actors.dds.AbstractShardBackendResolver.wrap(AbstractShardBackendResolver.java:129)&lt;span class=&quot;error&quot;&gt;&amp;#91;180:org.opendaylight.controller.sal-distributed-datastore:1.5.2.Carbon&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at org.opendaylight.controller.cluster.databroker.actors.dds.AbstractShardBackendResolver.lambda$connectShard$2(AbstractShardBackendResolver.java:142)&lt;span class=&quot;error&quot;&gt;&amp;#91;180:org.opendaylight.controller.sal-distributed-datastore:1.5.2.Carbon&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:760)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_141&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:736)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_141&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.util.concurrent.CompletableFuture$Completion.exec(CompletableFuture.java:443)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_141&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.util.concurrent.ForkJoinTask.doExec(ForkJoinTask.java:289)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_141&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.util.concurrent.ForkJoinPool$WorkQueue.runTask(ForkJoinPool.java:1056)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_141&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.util.concurrent.ForkJoinPool.runWorker(ForkJoinPool.java:1692)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_141&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.util.concurrent.ForkJoinWorkerThread.run(ForkJoinWorkerThread.java:157)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_141&amp;#93;&lt;/span&gt;&lt;br/&gt;
Caused by: akka.pattern.AskTimeoutException: Ask timed out on [ActorSelection&lt;span class=&quot;error&quot;&gt;&amp;#91;Anchor(akka://opendaylight-cluster-data/), Path(/user/shardmanager-config/member-1-shard-default-config)&amp;#93;&lt;/span&gt;] after &lt;span class=&quot;error&quot;&gt;&amp;#91;5000 ms&amp;#93;&lt;/span&gt;. Sender&lt;span class=&quot;error&quot;&gt;&amp;#91;null&amp;#93;&lt;/span&gt; sent message of type &quot;org.opendaylight.controller.cluster.access.commands.ConnectClientRequest&quot;.&lt;br/&gt;
        at akka.pattern.PromiseActorRef$$anonfun$1.apply$mcV$sp(AskSupport.scala:604)&lt;span class=&quot;error&quot;&gt;&amp;#91;154:com.typesafe.akka.actor:2.4.18&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.Scheduler$$anon$4.run(Scheduler.scala:126)&lt;span class=&quot;error&quot;&gt;&amp;#91;154:com.typesafe.akka.actor:2.4.18&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.Future$InternalCallbackExecutor$.unbatchedExecute(Future.scala:601)&lt;span class=&quot;error&quot;&gt;&amp;#91;150:org.scala-lang.scala-library:2.11.11.v20170413-090219-8a413ba7cc&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.BatchingExecutor$class.execute(BatchingExecutor.scala:109)&lt;span class=&quot;error&quot;&gt;&amp;#91;150:org.scala-lang.scala-library:2.11.11.v20170413-090219-8a413ba7cc&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.Future$InternalCallbackExecutor$.execute(Future.scala:599)&lt;span class=&quot;error&quot;&gt;&amp;#91;150:org.scala-lang.scala-library:2.11.11.v20170413-090219-8a413ba7cc&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$TaskHolder.executeTask(LightArrayRevolverScheduler.scala:329)&lt;span class=&quot;error&quot;&gt;&amp;#91;154:com.typesafe.akka.actor:2.4.18&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.executeBucket$1(LightArrayRevolverScheduler.scala:280)&lt;span class=&quot;error&quot;&gt;&amp;#91;154:com.typesafe.akka.actor:2.4.18&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.nextTick(LightArrayRevolverScheduler.scala:284)&lt;span class=&quot;error&quot;&gt;&amp;#91;154:com.typesafe.akka.actor:2.4.18&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.run(LightArrayRevolverScheduler.scala:236)&lt;span class=&quot;error&quot;&gt;&amp;#91;154:com.typesafe.akka.actor:2.4.18&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.lang.Thread.run(Thread.java:748)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_141&amp;#93;&lt;/span&gt;&lt;/p&gt;


&lt;p&gt;This seems to be pointing to the local shard actor, which, obviously, is not responding. I do not believe this is a problem in AbstractShardBackendResolver, but rather in ShardManager.&lt;/p&gt;</comment>
                            <comment id="52404" author="rovarga" created="Mon, 11 Sep 2017 13:48:47 +0000"  >&lt;p&gt;To clarify: the error resolution process (via actorContext.findPrimaryShardAsync(String)) is returning the local actor ref, even though it was already shut down.&lt;/p&gt;

&lt;p&gt;This means that either primaryShardInfoCache is not invalidated, or ShardManager is returning the local actor when queried via FindPrimary.&lt;/p&gt;

&lt;p&gt;In both cases this looks like a problem with ShardManager.&lt;/p&gt;</comment>
                            <comment id="52405" author="rovarga" created="Mon, 11 Sep 2017 14:04:55 +0000"  >&lt;p&gt;Guesstimate fix: &lt;a href=&quot;https://git.opendaylight.org/gerrit/62973&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/62973&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="52406" author="vrpolak" created="Tue, 12 Sep 2017 12:36:32 +0000"  >&lt;p&gt;&amp;gt; Guesstimate fix: &lt;a href=&quot;https://git.opendaylight.org/gerrit/62973&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/62973&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Merged. Ongoing Sandbox test &lt;span class=&quot;error&quot;&gt;&amp;#91;9&amp;#93;&lt;/span&gt; suggests that fixes this.&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;9&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://jenkins.opendaylight.org/sandbox/job/controller-csit-3node-ddb-clean-lead-shutdown-longevity-only-carbon/3/console&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://jenkins.opendaylight.org/sandbox/job/controller-csit-3node-ddb-clean-lead-shutdown-longevity-only-carbon/3/console&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="52407" author="vrpolak" created="Wed, 13 Sep 2017 08:30:41 +0000"  >&lt;p&gt;&amp;gt; Sandbox test &lt;span class=&quot;error&quot;&gt;&amp;#91;9&amp;#93;&lt;/span&gt; suggests that fixes this.&lt;/p&gt;

&lt;p&gt;Run #2 has failed without this fix, after 35 iterations which took around 75 minutes.&lt;br/&gt;
Run #3 has passed with this fix, after 23 hours. Setting to VERIFIED.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                            <customfield id="customfield_11400" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10208" key="com.atlassian.jira.plugin.system.customfieldtypes:textfield">
                        <customfieldname>External issue ID</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>8639</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10201" key="com.atlassian.jira.plugin.system.customfieldtypes:url">
                        <customfieldname>External issue URL</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue><![CDATA[https://bugs.opendaylight.org/show_bug.cgi?id=8639]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10206" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Issue Type</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10300"><![CDATA[Bug]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10204" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>ODL SR Target Milestone</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10337"><![CDATA[Carbon-SR2]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                    <customfield id="customfield_10000" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>0|i02s9r:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                </customfields>
    </item>
</channel>
</rss>