<!-- 
RSS generated by JIRA (8.20.10#820010-sha1:ace47f9899e9ee25d7157d59aa17ab06aee30d3d) at Wed Feb 07 19:56:23 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>OpenDaylight JIRA</title>
    <link>https://jira.opendaylight.org</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>8.20.10</version>
        <build-number>820010</build-number>
        <build-date>22-06-2022</build-date>
    </build-info>


<item>
            <title>[CONTROLLER-1757] Singleton leader chasing exhausts heap space in few hours</title>
                <link>https://jira.opendaylight.org/browse/CONTROLLER-1757</link>
                <project id="10113" key="CONTROLLER">controller</project>
                    <description>&lt;p&gt;This bug is not (yet) present in Carbon code. This Bug is affecting changes proposed around SR2 branch lock. Reporting, as this will probably prevent some fixes to be merged into SR2 candidate build.&lt;/p&gt;

&lt;p&gt;The exact build where this Bug happens is &lt;span class=&quot;error&quot;&gt;&amp;#91;0&amp;#93;&lt;/span&gt; which was intended to fix &lt;a href=&quot;https://jira.opendaylight.org/browse/MDSAL-275&quot; title=&quot;VerifyException from flapping service singleton registration&quot; class=&quot;issue-link&quot; data-issue-key=&quot;MDSAL-275&quot;&gt;&lt;del&gt;MDSAL-275&lt;/del&gt;&lt;/a&gt;. Which it does, but apparently there is a memory leak somewhere.&lt;/p&gt;

&lt;p&gt;Logs for the Sandbox run are here &lt;span class=&quot;error&quot;&gt;&amp;#91;1&amp;#93;&lt;/span&gt;, karaf.log files show UnreachableMember starts happening around three and a half hours into the test duration (corresponding to GC pauses of 5 and more seconds), gclogs directories show that members 1 and 3 end with allocation failure not recoverable by GC around 19 hours after the test starts. It is not clear whether heap dumps were created, they certainly have not been archived.&lt;/p&gt;

&lt;p&gt;Patches that were included in the build are: &lt;span class=&quot;error&quot;&gt;&amp;#91;2&amp;#93;&lt;/span&gt;, &lt;span class=&quot;error&quot;&gt;&amp;#91;3&amp;#93;&lt;/span&gt; (with its ancestors) and &lt;span class=&quot;error&quot;&gt;&amp;#91;4&amp;#93;&lt;/span&gt;.&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;0&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://nexus.opendaylight.org/content/repositories/opendaylight.snapshot/org/opendaylight/integration/integration/distribution/distribution-karaf/0.6.2-SNAPSHOT/distribution-karaf-0.6.2-20170823.082806-47.zip&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://nexus.opendaylight.org/content/repositories/opendaylight.snapshot/org/opendaylight/integration/integration/distribution/distribution-karaf/0.6.2-SNAPSHOT/distribution-karaf-0.6.2-20170823.082806-47.zip&lt;/a&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;1&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://logs.opendaylight.org/sandbox/jenkins091/controller-csit-3node-cs-chasing-leader-longevity-only-carbon/14/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://logs.opendaylight.org/sandbox/jenkins091/controller-csit-3node-cs-chasing-leader-longevity-only-carbon/14/&lt;/a&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://git.opendaylight.org/gerrit/#/c/61420/18&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/#/c/61420/18&lt;/a&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;3&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://git.opendaylight.org/gerrit/#/c/62170/4&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/#/c/62170/4&lt;/a&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;4&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://git.opendaylight.org/gerrit/#/c/62140/1&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/#/c/62140/1&lt;/a&gt;&lt;/p&gt;</description>
                <environment>&lt;p&gt;Operating System: All&lt;br/&gt;
Platform: All&lt;/p&gt;</environment>
        <key id="26311">CONTROLLER-1757</key>
            <summary>Singleton leader chasing exhausts heap space in few hours</summary>
                <type id="10104" iconUrl="https://jira.opendaylight.org/secure/viewavatar?size=xsmall&amp;avatarId=10303&amp;avatarType=issuetype">Bug</type>
                                                <status id="5" iconUrl="https://jira.opendaylight.org/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="green"/>
                                    <resolution id="10000">Done</resolution>
                                        <assignee username="rovarga">Robert Varga</assignee>
                                    <reporter username="vrpolak">Vratko Polak</reporter>
                        <labels>
                    </labels>
                <created>Fri, 25 Aug 2017 11:06:43 +0000</created>
                <updated>Wed, 6 Sep 2017 12:09:19 +0000</updated>
                            <resolved>Wed, 6 Sep 2017 12:09:19 +0000</resolved>
                                    <version>Carbon</version>
                                                    <component>clustering</component>
                        <due></due>
                            <votes>0</votes>
                                    <watches>3</watches>
                                                                                                                <comments>
                            <comment id="52630" author="rovarga" created="Fri, 25 Aug 2017 22:06:17 +0000"  >&lt;p&gt;The patch for &lt;a href=&quot;https://jira.opendaylight.org/browse/MDSAL-275&quot; title=&quot;VerifyException from flapping service singleton registration&quot; class=&quot;issue-link&quot; data-issue-key=&quot;MDSAL-275&quot;&gt;&lt;del&gt;MDSAL-275&lt;/del&gt;&lt;/a&gt; allows us to run cluster singleton much hotter than before (60-110tps vs. 5tps). 19 hour run at 60tps translates roughly to 19*3600*60*4 ~= 16M transactions.&lt;/p&gt;

&lt;p&gt;I suspect this is an EOS-specific rehash of &lt;a href=&quot;https://jira.opendaylight.org/browse/CONTROLLER-1746&quot; title=&quot;OOM with large number of closed transactions&quot; class=&quot;issue-link&quot; data-issue-key=&quot;CONTROLLER-1746&quot;&gt;&lt;del&gt;CONTROLLER-1746&lt;/del&gt;&lt;/a&gt; as EOS is a subclass of Shard and I suspect it interacts directly with ShardDataTree (and hence needs to play nice and purge its transactions).&lt;/p&gt;</comment>
                            <comment id="52631" author="rovarga" created="Wed, 30 Aug 2017 14:00:18 +0000"  >&lt;p&gt;I have re-created this in a unit test. It seems that this is coming from FrontendHistoryMetadataBuilder.purgedTransactions, which is not contiguous as expected, hence the RangeSet is not compressing properly.&lt;/p&gt;

&lt;p&gt;This seems to be coming from EntityOwnershipShard and its CommitCoordinator, which manually allocate transaction IDs for BatchedModifications, but those IDs are not contiguous:&lt;/p&gt;

&lt;p&gt;03:08:29,127 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-14&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59606-0, size 2&lt;br/&gt;
03:08:29,134 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-14&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59608-0, size 1&lt;br/&gt;
03:08:29,177 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-11&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59612-0, size 2&lt;br/&gt;
03:08:29,197 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-19&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59617-0, size 3&lt;br/&gt;
03:08:29,215 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-19&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59619-0, size 1&lt;br/&gt;
03:08:29,243 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-19&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59622-0, size 2&lt;br/&gt;
03:08:29,281 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-20&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59626-0, size 2&lt;br/&gt;
03:08:29,324 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-19&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59629-0, size 1&lt;br/&gt;
03:08:29,348 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-20&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59632-0, size 2&lt;br/&gt;
03:08:29,367 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-20&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59634-0, size 1&lt;br/&gt;
03:08:29,399 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-11&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59637-0, size 2&lt;br/&gt;
03:08:29,413 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-11&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59639-0, size 1&lt;br/&gt;
03:08:29,439 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-11&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59643-0, size 3&lt;br/&gt;
03:08:29,473 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-11&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59646-0, size 1&lt;br/&gt;
03:08:29,513 PM &lt;span class=&quot;error&quot;&gt;&amp;#91;cluster-test-shard-dispatcher-11&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;DEBUG&amp;#93;&lt;/span&gt; EntityOwnershipShard - Committing next BatchedModifications member-1-entity-ownership-internal-fe-0-txn-59650-0, size 3&lt;/p&gt;

&lt;p&gt;The fix for BUG-8858 is just flushing this out because it can tear through many more transitions, hence generates many more transactions.&lt;/p&gt;</comment>
                            <comment id="52632" author="rovarga" created="Wed, 30 Aug 2017 14:03:41 +0000"  >&lt;p&gt;&lt;a href=&quot;https://git.opendaylight.org/gerrit/62449&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/62449&lt;/a&gt; is the unit test showing the problem.&lt;/p&gt;</comment>
                            <comment id="52633" author="rovarga" created="Wed, 30 Aug 2017 14:41:06 +0000"  >&lt;p&gt;I think the problem is coming from early allocation of transaction ID in EntityOwnershipShardCommitCoordinator.newBatchedModifications(), which is then state compressed and not committed.&lt;/p&gt;

&lt;p&gt;Patch &lt;a href=&quot;https://git.opendaylight.org/gerrit/62453&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/62453&lt;/a&gt; modifies EOS to allocate BatchedModifications (and transaction ID) only just before we send it to the backend.&lt;/p&gt;</comment>
                            <comment id="52634" author="rovarga" created="Wed, 30 Aug 2017 14:59:38 +0000"  >&lt;p&gt;This is a Carbon -&amp;gt; Carbon SR1 regression, although the memory leak usually occurs very slowly.&lt;/p&gt;</comment>
                            <comment id="52635" author="vrpolak" created="Wed, 6 Sep 2017 12:09:19 +0000"  >&lt;p&gt;&amp;gt; Patch &lt;a href=&quot;https://git.opendaylight.org/gerrit/62453&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/62453&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Looks like everything has been merged.&lt;br/&gt;
Verification will be this &lt;span class=&quot;error&quot;&gt;&amp;#91;7&amp;#93;&lt;/span&gt; CSIT job passing, but I believe FIXED is the correct status right now.&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;7&amp;#93;&lt;/span&gt; &lt;a href=&quot;https://jenkins.opendaylight.org/releng/view/controller/job/controller-csit-3node-cs-chasing-leader-longevity-only-carbon/21/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://jenkins.opendaylight.org/releng/view/controller/job/controller-csit-3node-cs-chasing-leader-longevity-only-carbon/21/&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10000">
                    <name>Blocks</name>
                                            <outwardlinks description="blocks">
                                        <issuelink>
            <issuekey id="27097">MDSAL-275</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                            <customfield id="customfield_11400" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10208" key="com.atlassian.jira.plugin.system.customfieldtypes:textfield">
                        <customfieldname>External issue ID</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9054</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10201" key="com.atlassian.jira.plugin.system.customfieldtypes:url">
                        <customfieldname>External issue URL</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue><![CDATA[https://bugs.opendaylight.org/show_bug.cgi?id=9054]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10206" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Issue Type</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10300"><![CDATA[Bug]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10204" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>ODL SR Target Milestone</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10337"><![CDATA[Carbon-SR2]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                    <customfield id="customfield_10000" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>0|i02sjj:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                </customfields>
    </item>
</channel>
</rss>