<!-- 
RSS generated by JIRA (8.20.10#820010-sha1:ace47f9899e9ee25d7157d59aa17ab06aee30d3d) at Wed Feb 07 19:56:00 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>OpenDaylight JIRA</title>
    <link>https://jira.opendaylight.org</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>8.20.10</version>
        <build-number>820010</build-number>
        <build-date>22-06-2022</build-date>
    </build-info>


<item>
            <title>[CONTROLLER-1618] Scale testing: akka.pattern.AskTimeoutException ... after [30000 ms]</title>
                <link>https://jira.opendaylight.org/browse/CONTROLLER-1618</link>
                <project id="10113" key="CONTROLLER">controller</project>
                    <description>&lt;p&gt;Running scale tests on latest Boron code with a 3-node cluster.&lt;br/&gt;
ODL is part of an openstack, with 200 OVSs having a full-mesh of tunnels between them. 1 VM per OVS.&lt;br/&gt;
Everything seemed to work until around 196 VMs, but after that creating more VMs no longer works, and MD-SAL is throwing a lot of errors.&lt;br/&gt;
In the logs you can see I started the creation on 21/3/2017.&lt;br/&gt;
When I tried to create more VMs the next day (22/3/2017) at around 11:33:24, I started getting many errors in ODL1.&lt;br/&gt;
ODL 1 interesting errors:&lt;br/&gt;
2017-03-22 11:41:22,908 | ERROR | lt-dispatcher-45 | LocalThreePhaseCommitCohort      | 175 - org.opendaylight.controller.sal-distributed-datastore - 1.4.3.SNAPSHOT | Failed to prepare transaction member-1-datastore-config-fe-0-txn-28762919 on backend&lt;br/&gt;
akka.pattern.AskTimeoutException: Ask timed out on &lt;a href=&quot;#-515521380)]&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;ActorSelection[Anchor(akka://opendaylight-cluster-data/), Path(/user/shardmanager-config/member-1-shard-inventory-config#-515521380)]&lt;/a&gt; after &lt;span class=&quot;error&quot;&gt;&amp;#91;30000 ms&amp;#93;&lt;/span&gt;. Sender&lt;span class=&quot;error&quot;&gt;&amp;#91;null&amp;#93;&lt;/span&gt; sent message of type &quot;org.opendaylight.controller.cluster.datastore.messages.ReadyLocalTransaction&quot;.&lt;br/&gt;
        at akka.pattern.PromiseActorRef$$anonfun$1.apply$mcV$sp(AskSupport.scala:604)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.Scheduler$$anon$4.run(Scheduler.scala:126)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.Future$InternalCallbackExecutor$.unbatchedExecute(Future.scala:601)&lt;span class=&quot;error&quot;&gt;&amp;#91;153:org.scala-lang.scala-library:2.11.8.v20160304-115712-1706a37eb8&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.BatchingExecutor$class.execute(BatchingExecutor.scala:109)&lt;span class=&quot;error&quot;&gt;&amp;#91;153:org.scala-lang.scala-library:2.11.8.v20160304-115712-1706a37eb8&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.Future$InternalCallbackExecutor$.execute(Future.scala:599)&lt;span class=&quot;error&quot;&gt;&amp;#91;153:org.scala-lang.scala-library:2.11.8.v20160304-115712-1706a37eb8&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$TaskHolder.executeTask(LightArrayRevolverScheduler.scala:331)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.executeBucket$1(LightArrayRevolverScheduler.scala:282)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.nextTick(LightArrayRevolverScheduler.scala:286)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.run(LightArrayRevolverScheduler.scala:238)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.lang.Thread.run(Thread.java:745)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_121&amp;#93;&lt;/span&gt;&lt;br/&gt;
2017-03-22 11:41:22,908 | ERROR | lt-dispatcher-59 | LocalThreePhaseCommitCohort      | 175 - org.opendaylight.controller.sal-distributed-datastore - 1.4.3.SNAPSHOT | Failed to prepare transaction member-1-datastore-config-fe-0-txn-28762921 on backend&lt;br/&gt;
akka.pattern.AskTimeoutException: Ask timed out on &lt;a href=&quot;#-515521380)]&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;ActorSelection[Anchor(akka://opendaylight-cluster-data/), Path(/user/shardmanager-config/member-1-shard-inventory-config#-515521380)]&lt;/a&gt; after &lt;span class=&quot;error&quot;&gt;&amp;#91;30000 ms&amp;#93;&lt;/span&gt;. Sender&lt;span class=&quot;error&quot;&gt;&amp;#91;null&amp;#93;&lt;/span&gt; sent message of type &quot;org.opendaylight.controller.cluster.datastore.messages.ReadyLocalTransaction&quot;.&lt;br/&gt;
        at akka.pattern.PromiseActorRef$$anonfun$1.apply$mcV$sp(AskSupport.scala:604)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.Scheduler$$anon$4.run(Scheduler.scala:126)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.Future$InternalCallbackExecutor$.unbatchedExecute(Future.scala:601)&lt;span class=&quot;error&quot;&gt;&amp;#91;153:org.scala-lang.scala-library:2.11.8.v20160304-115712-1706a37eb8&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.BatchingExecutor$class.execute(BatchingExecutor.scala:109)&lt;span class=&quot;error&quot;&gt;&amp;#91;153:org.scala-lang.scala-library:2.11.8.v20160304-115712-1706a37eb8&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.Future$InternalCallbackExecutor$.execute(Future.scala:599)&lt;span class=&quot;error&quot;&gt;&amp;#91;153:org.scala-lang.scala-library:2.11.8.v20160304-115712-1706a37eb8&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$TaskHolder.executeTask(LightArrayRevolverScheduler.scala:331)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.executeBucket$1(LightArrayRevolverScheduler.scala:282)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.nextTick(LightArrayRevolverScheduler.scala:286)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.run(LightArrayRevolverScheduler.scala:238)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.lang.Thread.run(Thread.java:745)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_121&amp;#93;&lt;/span&gt;&lt;br/&gt;
2017-03-22 11:41:22,908 | WARN  | t-dispatcher-134 | ConcurrentDOMDataBroker          | 175 - org.opendaylight.controller.sal-distributed-datastore - 1.4.3.SNAPSHOT | Tx: DOM-54456305 Error during phase CAN_COMMIT, starting Abort&lt;br/&gt;
akka.pattern.AskTimeoutException: Ask timed out on &lt;a href=&quot;#-515521380)]&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;ActorSelection[Anchor(akka://opendaylight-cluster-data/), Path(/user/shardmanager-config/member-1-shard-inventory-config#-515521380)]&lt;/a&gt; after &lt;span class=&quot;error&quot;&gt;&amp;#91;30000 ms&amp;#93;&lt;/span&gt;. Sender&lt;span class=&quot;error&quot;&gt;&amp;#91;null&amp;#93;&lt;/span&gt; sent message of type &quot;org.opendaylight.controller.cluster.datastore.messages.ReadyLocalTransaction&quot;.&lt;br/&gt;
        at akka.pattern.PromiseActorRef$$anonfun$1.apply$mcV$sp(AskSupport.scala:604)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.Scheduler$$anon$4.run(Scheduler.scala:126)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.Future$InternalCallbackExecutor$.unbatchedExecute(Future.scala:601)&lt;span class=&quot;error&quot;&gt;&amp;#91;153:org.scala-lang.scala-library:2.11.8.v20160304-115712-1706a37eb8&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.BatchingExecutor$class.execute(BatchingExecutor.scala:109)&lt;span class=&quot;error&quot;&gt;&amp;#91;153:org.scala-lang.scala-library:2.11.8.v20160304-115712-1706a37eb8&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at scala.concurrent.Future$InternalCallbackExecutor$.execute(Future.scala:599)&lt;span class=&quot;error&quot;&gt;&amp;#91;153:org.scala-lang.scala-library:2.11.8.v20160304-115712-1706a37eb8&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$TaskHolder.executeTask(LightArrayRevolverScheduler.scala:331)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.executeBucket$1(LightArrayRevolverScheduler.scala:282)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.nextTick(LightArrayRevolverScheduler.scala:286)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at akka.actor.LightArrayRevolverScheduler$$anon$4.run(LightArrayRevolverScheduler.scala:238)&lt;span class=&quot;error&quot;&gt;&amp;#91;157:com.typesafe.akka.actor:2.4.7&amp;#93;&lt;/span&gt;&lt;br/&gt;
        at java.lang.Thread.run(Thread.java:745)&lt;span class=&quot;error&quot;&gt;&amp;#91;:1.8.0_121&amp;#93;&lt;/span&gt;&lt;/p&gt;

&lt;p&gt;ODL 3 interesting errors:&lt;br/&gt;
2017-03-22 11:33:27,068 | ERROR | Pool-1-worker-37 | DataStoreJobCoordinator          | 283 - org.opendaylight.genius.mdsalutil-api - 0.1.3.SNAPSHOT | Exception when executing jobEntry: JobEntry&lt;/p&gt;
{key=&apos;MAC-00:1C:7
3:4E:D3:31 ELAN_TAG-5501DPN_ID-66396557993593&apos;, mainWorker=org.opendaylight.netvirt.elan.internal.ElanPacketInHandler$$Lambda$183/1454185117@69186057, rollbackWorker=null, retryCount=0, futures=null}
&lt;p&gt;java.lang.RuntimeException: java.util.concurrent.ExecutionException: ReadFailedException{message=Error executeRead ReadData for path /(urn:opendaylight:netvirt:elan?revision=2015-06-02)elan-interfaces/elan-inter&lt;br/&gt;
face/elan-interface[&lt;/p&gt;
{(urn:opendaylight:netvirt:elan?revision=2015-06-02)name=tun816c0459241}
&lt;p&gt;], errorList=[RpcError [message=Error executeRead ReadData for path /(urn:opendaylight:netvirt:elan?revision=2015-06-02&lt;br/&gt;
)elan-interfaces/elan-interface/elan-interface[&lt;/p&gt;
{(urn:opendaylight:netvirt:elan?revision=2015-06-02)name=tun816c0459241}
&lt;p&gt;], severity=ERROR, errorType=APPLICATION, tag=operation-failed, applicationTag=null, info=nu&lt;br/&gt;
ll, cause=java.lang.Exception: Error creating READ_ONLY transaction on shard default]]}&lt;br/&gt;
        at org.opendaylight.genius.mdsalutil.MDSALUtil.read(MDSALUtil.java:512)&lt;br/&gt;
        at org.opendaylight.netvirt.elan.utils.ElanUtils.getElanInterfaceByElanInterfaceName(ElanUtils.java:364)&lt;br/&gt;
        at org.opendaylight.netvirt.elan.utils.ElanUtils.getEtreeInterfaceByElanInterfaceName(ElanUtils.java:373)&lt;br/&gt;
        at org.opendaylight.netvirt.elan.utils.ElanUtils.setupEtreeRemoteDmacFlow(ElanUtils.java:1103)&lt;br/&gt;
        at org.opendaylight.netvirt.elan.utils.ElanUtils.setupRemoteDmacFlow(ElanUtils.java:1095)&lt;br/&gt;
        at org.opendaylight.netvirt.elan.utils.ElanUtils.setupOrigDmacFlows(ElanUtils.java:954)&lt;br/&gt;
        at org.opendaylight.netvirt.elan.utils.ElanUtils.setupMacFlows(ElanUtils.java:738)&lt;br/&gt;
        at org.opendaylight.netvirt.elan.internal.ElanPacketInHandler.lambda$enqueueJobForDPNSpecificTasks$1(ElanPacketInHandler.java:198)&lt;br/&gt;
        at org.opendaylight.genius.datastoreutils.DataStoreJobCoordinator$MainTask.run(DataStoreJobCoordinator.java:254)&lt;br/&gt;
        at java.util.concurrent.ForkJoinTask$RunnableExecuteAction.exec(ForkJoinTask.java:1402)&lt;br/&gt;
        at java.util.concurrent.ForkJoinTask.doExec(ForkJoinTask.java:289)&lt;br/&gt;
        at java.util.concurrent.ForkJoinPool$WorkQueue.runTask(ForkJoinPool.java:1056)&lt;br/&gt;
        at java.util.concurrent.ForkJoinPool.runWorker(ForkJoinPool.java:1692)&lt;br/&gt;
        at java.util.concurrent.ForkJoinWorkerThread.run(ForkJoinWorkerThread.java:157)&lt;br/&gt;
Caused by: java.util.concurrent.ExecutionException: ReadFailedException{message=Error executeRead ReadData for path /(urn:opendaylight:netvirt:elan?revision=2015-06-02)elan-interfaces/elan-interface/elan-interfa&lt;br/&gt;
ce[&lt;/p&gt;
{(urn:opendaylight:netvirt:elan?revision=2015-06-02)name=tun816c0459241}
&lt;p&gt;], errorList=[RpcError [message=Error executeRead ReadData for path /(urn:opendaylight:netvirt:elan?revision=2015-06-02)elan-interfaces/&lt;br/&gt;
elan-interface/elan-interface[&lt;/p&gt;
{(urn:opendaylight:netvirt:elan?revision=2015-06-02)name=tun816c0459241}
&lt;p&gt;], severity=ERROR, errorType=APPLICATION, tag=operation-failed, applicationTag=null, info=null, cause=java.la&lt;br/&gt;
ng.Exception: Error creating READ_ONLY transaction on shard default]]}&lt;br/&gt;
        at org.opendaylight.yangtools.util.concurrent.MappingCheckedFuture.wrapInExecutionException(MappingCheckedFuture.java:63)&lt;br/&gt;
        at org.opendaylight.yangtools.util.concurrent.MappingCheckedFuture.get(MappingCheckedFuture.java:76)&lt;br/&gt;
        at org.opendaylight.genius.mdsalutil.MDSALUtil.read(MDSALUtil.java:510)&lt;br/&gt;
        ... 13 more&lt;br/&gt;
Caused by: ReadFailedException{message=Error executeRead ReadData for path /(urn:opendaylight:netvirt:elan?revision=2015-06-02)elan-interfaces/elan-interface/elan-interface[&lt;/p&gt;
{(urn:opendaylight:netvirt:elan?revisi
on=2015-06-02)name=tun816c0459241}
&lt;p&gt;], errorList=[RpcError [message=Error executeRead ReadData for path /(urn:opendaylight:netvirt:elan?revision=2015-06-02)elan-interfaces/elan-interface/elan-interface[&lt;/p&gt;
{(urn:opend
aylight:netvirt:elan?revision=2015-06-02)name=tun816c0459241}
&lt;p&gt;], severity=ERROR, errorType=APPLICATION, tag=operation-failed, applicationTag=null, info=null, cause=java.lang.Exception: Error creating READ_ONLY tr&lt;br/&gt;
ansaction on shard default]]}&lt;br/&gt;
        at org.opendaylight.controller.cluster.datastore.NoOpTransactionContext.executeRead(NoOpTransactionContext.java:67)&lt;br/&gt;
        at org.opendaylight.controller.cluster.datastore.TransactionProxy$1.invoke(TransactionProxy.java:93)&lt;br/&gt;
        at org.opendaylight.controller.cluster.datastore.TransactionContextWrapper.executePriorTransactionOperations(TransactionContextWrapper.java:132)&lt;br/&gt;
        at org.opendaylight.controller.cluster.datastore.RemoteTransactionContextSupport.createTransactionContext(RemoteTransactionContextSupport.java:239)&lt;br/&gt;
        at org.opendaylight.controller.cluster.datastore.RemoteTransactionContextSupport.onCreateTransactionComplete(RemoteTransactionContextSupport.java:202)&lt;br/&gt;
        at org.opendaylight.controller.cluster.datastore.RemoteTransactionContextSupport.access$000(RemoteTransactionContextSupport.java:39)&lt;br/&gt;
        at org.opendaylight.controller.cluster.datastore.RemoteTransactionContextSupport$1.onComplete(RemoteTransactionContextSupport.java:137)&lt;br/&gt;
        at akka.dispatch.OnComplete.internal(Future.scala:258)&lt;br/&gt;
        at akka.dispatch.OnComplete.internal(Future.scala:256)&lt;br/&gt;
        at akka.dispatch.japi$CallbackBridge.apply(Future.scala:186)&lt;br/&gt;
        at akka.dispatch.japi$CallbackBridge.apply(Future.scala:183)&lt;br/&gt;
        at scala.concurrent.impl.CallbackRunnable.run(Promise.scala:32)&lt;br/&gt;
        at akka.dispatch.BatchingExecutor$AbstractBatch.processBatch(BatchingExecutor.scala:55)&lt;br/&gt;
        at akka.dispatch.BatchingExecutor$BlockableBatch$$anonfun$run$1.apply$mcV$sp(BatchingExecutor.scala:91)&lt;/p&gt;


&lt;p&gt;Ran jolokia/read/org.opendaylight.controller:Category=Shards,name=member-X-shard-topology-operational,type=DistributedOperationalDatastore on all ODLs.&lt;br/&gt;
Results:&lt;br/&gt;
ODL1:&lt;br/&gt;
{&quot;request&quot;:&lt;/p&gt;
{&quot;mbean&quot;:&quot;org.opendaylight.controller:Category=Shards,name=member-1-shard-topology-operational,type=DistributedOperationalDatastore&quot;,&quot;type&quot;:&quot;read&quot;}
&lt;p&gt;,&quot;value&quot;:&lt;/p&gt;
{&quot;ReadWriteTransactionCount&quot;:0,&quot;SnapshotIndex&quot;:2645417,&quot;InMemoryJournalLogSize&quot;:6,&quot;ReplicatedToAllIndex&quot;:2645417,&quot;Leader&quot;:&quot;member-3-shard-topology-operational&quot;,&quot;LastIndex&quot;:2645423,&quot;RaftState&quot;:&quot;Follower&quot;,&quot;LastApplied&quot;:2645423,&quot;LastCommittedTransactionTime&quot;:&quot;1970-01-01 02:00:00.000&quot;,&quot;LastLogIndex&quot;:2645423,&quot;LastLeadershipChangeTime&quot;:&quot;2017-03-21 18:06:45.018&quot;,&quot;PeerAddresses&quot;:&quot;member-2-shard-topology-operational: , member-3-shard-topology-operational: akka.tcp:\/\/opendaylight-cluster-data@172.16.1.153:2550\/user\/shardmanager-operational\/member-3-shard-topology-operational&quot;,&quot;WriteOnlyTransactionCount&quot;:0,&quot;FollowerInitialSyncStatus&quot;:true,&quot;FollowerInfo&quot;:[],&quot;FailedReadTransactionsCount&quot;:0,&quot;Voting&quot;:true,&quot;StatRetrievalTime&quot;:&quot;2.828 ms&quot;,&quot;CurrentTerm&quot;:1,&quot;LastTerm&quot;:1,&quot;FailedTransactionsCount&quot;:0,&quot;PendingTxCommitQueueSize&quot;:0,&quot;VotedFor&quot;:&quot;member-3-shard-topology-operational&quot;,&quot;SnapshotCaptureInitiated&quot;:false,&quot;CommittedTransactionsCount&quot;:0,&quot;TxCohortCacheSize&quot;:0,&quot;PeerVotingStates&quot;:&quot;member-2-shard-topology-operational: true, member-3-shard-topology-operational: true&quot;,&quot;LastLogTerm&quot;:1,&quot;StatRetrievalError&quot;:null,&quot;CommitIndex&quot;:2645423,&quot;SnapshotTerm&quot;:1,&quot;AbortTransactionsCount&quot;:0,&quot;ReadOnlyTransactionCount&quot;:0,&quot;ShardName&quot;:&quot;member-1-shard-topology-operational&quot;,&quot;LeadershipChangeCount&quot;:1,&quot;InMemoryJournalDataSize&quot;:7452}
&lt;p&gt;,&quot;timestamp&quot;:1490175963,&quot;status&quot;:200}&lt;br/&gt;
ODL2:&lt;br/&gt;
{&quot;request&quot;:&lt;/p&gt;
{&quot;mbean&quot;:&quot;org.opendaylight.controller:Category=Shards,name=member-2-shard-topology-operational,type=DistributedOperationalDatastore&quot;,&quot;type&quot;:&quot;read&quot;}
&lt;p&gt;,&quot;value&quot;:&lt;/p&gt;
{&quot;ReadWriteTransactionCount&quot;:0,&quot;SnapshotIndex&quot;:2645983,&quot;InMemoryJournalLogSize&quot;:3,&quot;ReplicatedToAllIndex&quot;:2645983,&quot;Leader&quot;:&quot;member-3-shard-topology-operational&quot;,&quot;LastIndex&quot;:2645986,&quot;RaftState&quot;:&quot;Follower&quot;,&quot;LastCommittedTransactionTime&quot;:&quot;1970-01-01 02:00:00.000&quot;,&quot;LastApplied&quot;:2645985,&quot;LastLogIndex&quot;:2645986,&quot;LastLeadershipChangeTime&quot;:&quot;2017-03-21 18:06:45.011&quot;,&quot;PeerAddresses&quot;:&quot;member-1-shard-topology-operational: , member-3-shard-topology-operational: akka.tcp:\/\/opendaylight-cluster-data@172.16.1.153:2550\/user\/shardmanager-operational\/member-3-shard-topology-operational&quot;,&quot;WriteOnlyTransactionCount&quot;:0,&quot;FollowerInitialSyncStatus&quot;:true,&quot;FollowerInfo&quot;:[],&quot;FailedReadTransactionsCount&quot;:0,&quot;StatRetrievalTime&quot;:&quot;11.85 ms&quot;,&quot;Voting&quot;:true,&quot;CurrentTerm&quot;:1,&quot;LastTerm&quot;:1,&quot;FailedTransactionsCount&quot;:0,&quot;PendingTxCommitQueueSize&quot;:0,&quot;VotedFor&quot;:&quot;member-3-shard-topology-operational&quot;,&quot;SnapshotCaptureInitiated&quot;:false,&quot;CommittedTransactionsCount&quot;:0,&quot;TxCohortCacheSize&quot;:0,&quot;PeerVotingStates&quot;:&quot;member-1-shard-topology-operational: true, member-3-shard-topology-operational: true&quot;,&quot;LastLogTerm&quot;:1,&quot;StatRetrievalError&quot;:null,&quot;CommitIndex&quot;:2645985,&quot;SnapshotTerm&quot;:1,&quot;AbortTransactionsCount&quot;:0,&quot;ReadOnlyTransactionCount&quot;:0,&quot;ShardName&quot;:&quot;member-2-shard-topology-operational&quot;,&quot;LeadershipChangeCount&quot;:1,&quot;InMemoryJournalDataSize&quot;:3726}
&lt;p&gt;,&quot;timestamp&quot;:1490175977,&quot;status&quot;:200}&lt;br/&gt;
ODL3:&lt;br/&gt;
{&quot;request&quot;:&lt;/p&gt;
{&quot;mbean&quot;:&quot;org.opendaylight.controller:Category=Shards,name=member-3-shard-topology-operational,type=DistributedOperationalDatastore&quot;,&quot;type&quot;:&quot;read&quot;}
&lt;p&gt;,&quot;value&quot;:{&quot;ReadWriteTransactionCount&quot;:881228,&quot;SnapshotIndex&quot;:2646308,&quot;InMemoryJournalLogSize&quot;:5,&quot;ReplicatedToAllIndex&quot;:2646308,&quot;Leader&quot;:&quot;member-3-shard-topology-operational&quot;,&quot;LastIndex&quot;:2646313,&quot;RaftState&quot;:&quot;Leader&quot;,&quot;LastCommittedTransactionTime&quot;:&quot;2017-03-22 11:46:26.848&quot;,&quot;LastApplied&quot;:2646313,&quot;LastLeadershipChangeTime&quot;:&quot;2017-03-21 18:06:44.977&quot;,&quot;LastLogIndex&quot;:2646313,&quot;PeerAddresses&quot;:&quot;member-1-shard-topology-operational: akka.tcp:\/\/opendaylight-cluster-data@172.16.1.142:2550\/user\/shardmanager-operational\/member-1-shard-topology-operational, member-2-shard-topology-operational: akka.tcp:\/\/opendaylight-cluster-data@172.16.1.136:2550\/user\/shardmanager-operational\/member-2-shard-topology-operational&quot;,&quot;FollowerInitialSyncStatus&quot;:false,&quot;WriteOnlyTransactionCount&quot;:0,&quot;FollowerInfo&quot;:[{&quot;timeSinceLastActivity&quot;:&quot;00:00:00.070&quot;,&quot;active&quot;:true,&quot;matchIndex&quot;:2646308,&quot;voting&quot;:&lt;/p&gt;</description>
                <environment>&lt;p&gt;Operating System: All&lt;br/&gt;
Platform: All&lt;/p&gt;</environment>
        <key id="26172">CONTROLLER-1618</key>
            <summary>Scale testing: akka.pattern.AskTimeoutException ... after [30000 ms]</summary>
                <type id="10104" iconUrl="https://jira.opendaylight.org/secure/viewavatar?size=xsmall&amp;avatarId=10303&amp;avatarType=issuetype">Bug</type>
                                                <status id="5" iconUrl="https://jira.opendaylight.org/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="green"/>
                                    <resolution id="10002">Duplicate</resolution>
                                        <assignee username="-1">Unassigned</assignee>
                                    <reporter username="guy.sela@hpe.com">Guy Sela</reporter>
                        <labels>
                    </labels>
                <created>Wed, 22 Mar 2017 10:06:52 +0000</created>
                <updated>Tue, 25 Jul 2023 08:24:27 +0000</updated>
                            <resolved>Wed, 12 Apr 2017 02:56:41 +0000</resolved>
                                                                    <component>clustering</component>
                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                                                                <comments>
                            <comment id="51843" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:06:52 +0000"  >&lt;p&gt;Attachment odl2.tar.gz has been added with description: ODL2 Logs&lt;/p&gt;</comment>
                            <comment id="51844" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:07:20 +0000"  >&lt;p&gt;Attachment odl3-part1.tar.gz has been added with description: Odl3 logs part 1&lt;/p&gt;</comment>
                            <comment id="51845" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:07:41 +0000"  >&lt;p&gt;Attachment odl3-part2.tar.gz has been added with description: Odl3 logs part 2&lt;/p&gt;</comment>
                            <comment id="51846" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:08:04 +0000"  >&lt;p&gt;Attachment odl1-part1.tar.gz has been added with description: ODL1 logs part 1&lt;/p&gt;</comment>
                            <comment id="51847" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:08:24 +0000"  >&lt;p&gt;Attachment odl1-part2.tar.gz has been added with description: ODL1 logs part 2&lt;/p&gt;</comment>
                            <comment id="51848" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:08:41 +0000"  >&lt;p&gt;Attachment odl1-part3.tar.gz has been added with description: ODL1 logs part 3&lt;/p&gt;</comment>
                            <comment id="51849" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:08:57 +0000"  >&lt;p&gt;Attachment odl1-part4.tar.gz has been added with description: ODL1 logs part 4&lt;/p&gt;</comment>
                            <comment id="51850" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:09:12 +0000"  >&lt;p&gt;Attachment odl1-part5.tar.gz has been added with description: ODL1 logs part 5&lt;/p&gt;</comment>
                            <comment id="51851" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:09:24 +0000"  >&lt;p&gt;Attachment odl1-part6.tar.gz has been added with description: ODL1 logs part 6&lt;/p&gt;</comment>
                            <comment id="51835" author="tpantelis" created="Wed, 22 Mar 2017 18:27:38 +0000"  >&lt;p&gt;Where&apos;s the rest of the jolokia output from ODL3? ODL3 was the leader so it&apos;s important  to see all the output.&lt;/p&gt;

&lt;p&gt;In any event, there were over 2.6M transactions generated in shard topology-operational - pretty high volume. However the timeout errors occurred for shard inventory-config. What volume of transactions are occurring for inventory-config? It would be useful to see the jolokia output.&lt;/p&gt;

&lt;p&gt;This is probably the same as &lt;a href=&quot;https://jira.opendaylight.org/browse/CONTROLLER-1483&quot; title=&quot;akka.pattern.AskTimeoutException on follower while BGP peer introduces 1M prefixes&quot; class=&quot;issue-link&quot; data-issue-key=&quot;CONTROLLER-1483&quot;&gt;&lt;del&gt;CONTROLLER-1483&lt;/del&gt;&lt;/a&gt; - the volume of client transactions overloads the shards. At some point, it will saturate, i.e. the backend replication can&apos;t keep up with the front-end client rate. &lt;/p&gt;

&lt;p&gt;It would be useful to profile the CPU/memory usage and GC activity as the test is running. Also how much memory was allocated to the JVM? Is it enough?&lt;/p&gt;</comment>
                            <comment id="51836" author="guy.sela@hpe.com" created="Thu, 23 Mar 2017 09:27:14 +0000"  >&lt;p&gt;&amp;gt;&amp;gt; Where&apos;s the rest of the jolokia output from ODL3? ODL3 was the leader so it&apos;s &amp;gt;&amp;gt; important  to see all the output.&lt;br/&gt;
Weird, I thought I copied everything; if I reproduce it, I&apos;ll re-paste it here.&lt;/p&gt;

&lt;p&gt;&amp;gt;&amp;gt; In any event, there were over 2.6M transactions generated in shard topology-operational - pretty high volume. &lt;br/&gt;
&amp;gt;&amp;gt; However the timeout errors occurred for shard inventory-config. What volume of &amp;gt;&amp;gt; transactions are occurring for inventory-config? It would be useful to see the &amp;gt;&amp;gt; jolokia output.&lt;br/&gt;
Regarding the jolokia output, what kind of query do you need me to run ?&lt;br/&gt;
Regarding the volume, I am not a netvirt expert, we can ask the netvirt-dev, but we are talking about 200 OVSs, with 1 VM per OVS. The VMs are spawned at a rate of about 1 per 7 seconds, so the rate is very low. Of course every spawn of a VM in a mesh of tunnels causes a creation of many tunnels, but still, the rate is very slow.&lt;/p&gt;

&lt;p&gt;This is probably the same as &lt;a href=&quot;https://jira.opendaylight.org/browse/CONTROLLER-1483&quot; title=&quot;akka.pattern.AskTimeoutException on follower while BGP peer introduces 1M prefixes&quot; class=&quot;issue-link&quot; data-issue-key=&quot;CONTROLLER-1483&quot;&gt;&lt;del&gt;CONTROLLER-1483&lt;/del&gt;&lt;/a&gt; - the volume of client transactions overloads the shards. At some point, it will saturate, i.e. the backend replication can&apos;t keep up with the front-end client rate. &lt;/p&gt;

&lt;p&gt;&amp;gt;&amp;gt; It would be useful to profile the CPU/memory usage and GC activity as the test &amp;gt;&amp;gt; is running. Also how much memory was allocated to the JVM? Is it enough?&lt;br/&gt;
GC activity is found in karaf.out - should be attached for every ODL.&lt;br/&gt;
Memory-wise we are talking about a 24G Heap, and we are using the G1 Collector.&lt;/p&gt;</comment>
                            <comment id="51837" author="rovarga" created="Thu, 23 Mar 2017 12:35:01 +0000"  >&lt;p&gt;That number of transactions is alarming &amp;#8211; I think we should be teaching netvirt about transaction chains and pingpong...&lt;/p&gt;

&lt;p&gt;At any rate, this is definitely a duplicate of 5280.&lt;/p&gt;</comment>
                            <comment id="51838" author="guy.sela@hpe.com" created="Thu, 23 Mar 2017 12:42:25 +0000"  >&lt;p&gt;1) How do you know how many transactions happen per second ? This must be the more interesting number. &lt;br/&gt;
2) Can you tell the total amount of transactions before the ERRORS start to happen?&lt;/p&gt;</comment>
                            <comment id="51839" author="guy.sela@hpe.com" created="Thu, 23 Mar 2017 16:29:36 +0000"  >&lt;p&gt;CPU usage is around 120% on a 45 cores system (Which means it can get up to 4500%).&lt;br/&gt;
One of the cores is almost constantly on 100%.&lt;/p&gt;</comment>
                            <comment id="51840" author="guy.sela@hpe.com" created="Thu, 23 Mar 2017 16:32:29 +0000"  >&lt;p&gt;Some of the time the system is at around 300% CPU from potential 4500%&lt;/p&gt;</comment>
                            <comment id="51841" author="rovarga" created="Thu, 23 Mar 2017 16:43:20 +0000"  >&lt;p&gt;Re. 1) it&apos;s just a guess &amp;#8211; the combination of the two things brings about batching, which reduces the number of transactions significantly &amp;#8211; 100:1 is usual in BGP. It also has the added benefit of spreading the workload across multiple threads.&lt;/p&gt;

&lt;p&gt;Re. 2) there are no hard guidelines on when AskTimeouts start to happen &amp;#8211; they happen if the backend cannot keep up with the frontend and that depends on a large number of factors:&lt;/p&gt;
&lt;ul class=&quot;alternate&quot; type=&quot;square&quot;&gt;
	&lt;li&gt;inter-node connectivity&lt;/li&gt;
	&lt;li&gt;GCs&lt;/li&gt;
	&lt;li&gt;snapshots&lt;/li&gt;
	&lt;li&gt;overall volume of data already stored&lt;/li&gt;
	&lt;li&gt;transaction size&lt;/li&gt;
	&lt;li&gt;modification rate&lt;/li&gt;
	&lt;li&gt;storage performance&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="51842" author="tpantelis" created="Fri, 24 Mar 2017 00:46:59 +0000"  >&lt;p&gt;The TransactionCreationRateLimit JMX attribute under DistributedOperationalDatastore gives a pretty good idea of transactions per sec. This is the calculated rate limit used to throttle transactions on the front-end.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10002">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="26037">CONTROLLER-1483</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="13621" name="odl1-part1.tar.gz" size="768917" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:08:04 +0000"/>
                            <attachment id="13622" name="odl1-part2.tar.gz" size="861371" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:08:24 +0000"/>
                            <attachment id="13623" name="odl1-part3.tar.gz" size="939707" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:08:41 +0000"/>
                            <attachment id="13624" name="odl1-part4.tar.gz" size="292448" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:08:57 +0000"/>
                            <attachment id="13625" name="odl1-part5.tar.gz" size="309660" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:09:12 +0000"/>
                            <attachment id="13626" name="odl1-part6.tar.gz" size="30512" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:09:24 +0000"/>
                            <attachment id="13618" name="odl2.tar.gz" size="515685" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:06:52 +0000"/>
                            <attachment id="13619" name="odl3-part1.tar.gz" size="925579" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:07:20 +0000"/>
                            <attachment id="13620" name="odl3-part2.tar.gz" size="421719" author="guy.sela@hpe.com" created="Wed, 22 Mar 2017 10:07:41 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                            <customfield id="customfield_11400" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10208" key="com.atlassian.jira.plugin.system.customfieldtypes:textfield">
                        <customfieldname>External issue ID</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>8041</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10201" key="com.atlassian.jira.plugin.system.customfieldtypes:url">
                        <customfieldname>External issue URL</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue><![CDATA[https://bugs.opendaylight.org/show_bug.cgi?id=8041]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                <customfield id="customfield_10000" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>0|i02ron:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                </customfields>
    </item>
</channel>
</rss>