<!-- 
RSS generated by JIRA (8.20.10#820010-sha1:ace47f9899e9ee25d7157d59aa17ab06aee30d3d) at Wed Feb 07 19:59:54 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>OpenDaylight JIRA</title>
    <link>https://jira.opendaylight.org</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>8.20.10</version>
        <build-number>820010</build-number>
        <build-date>22-06-2022</build-date>
    </build-info>


<item>
            <title>[GENIUS-96] DataStoreJobCoordinator OOM</title>
                <link>https://jira.opendaylight.org/browse/GENIUS-96</link>
                <project id="10126" key="GENIUS">genius</project>
                    <description>&lt;p&gt;Internal downstream testing reports OOM with latest stable/nitrogen builds.&lt;/p&gt;

&lt;p&gt;HPROF analysis by MAT points to something really badly wrong in DataStoreJobCoordinator.&lt;/p&gt;

&lt;p&gt;see attached ZIP&lt;/p&gt;</description>
                <environment></environment>
        <key id="28693">GENIUS-96</key>
            <summary>DataStoreJobCoordinator OOM</summary>
                <type id="10104" iconUrl="https://jira.opendaylight.org/secure/viewavatar?size=xsmall&amp;avatarId=10303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.opendaylight.org/images/icons/priorities/blocker.svg">Highest</priority>
                        <status id="10004" iconUrl="https://jira.opendaylight.org/images/icons/status_generic.gif" description="">Verified</status>
                    <statusCategory id="3" key="done" colorName="green"/>
                                    <resolution id="10003">Cannot Reproduce</resolution>
                                        <assignee username="vorburger">Michael Vorburger</assignee>
                                    <reporter username="vorburger">Michael Vorburger</reporter>
                        <labels>
                    </labels>
                <created>Fri, 3 Nov 2017 21:51:32 +0000</created>
                <updated>Thu, 19 Apr 2018 14:41:46 +0000</updated>
                            <resolved>Thu, 19 Apr 2018 14:41:46 +0000</resolved>
                                    <version>Nitrogen-SR1</version>
                                    <fixVersion>Nitrogen-SR1</fixVersion>
                                    <component>General</component>
                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                                                                <comments>
                            <comment id="59911" author="vorburger" created="Fri, 3 Nov 2017 22:38:36 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.opendaylight.org/secure/ViewProfile.jspa?name=tpantelis&quot; class=&quot;user-hover&quot; rel=&quot;tpantelis&quot;&gt;tpantelis&lt;/a&gt; dixit:&lt;/p&gt;

&lt;blockquote&gt;&lt;p&gt;maybe some job got stuck or took a long time and backed up a queue&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;This somehow sounds familiar - didn&apos;t you mention something like this somewhere recently, &lt;a href=&quot;https://jira.opendaylight.org/secure/ViewProfile.jspa?name=k.faseela&quot; class=&quot;user-hover&quot; rel=&quot;k.faseela&quot;&gt;k.faseela&lt;/a&gt; ?&lt;/p&gt;

&lt;p&gt;BTW this reminds me that during the code reviews of the genius DJC to infrautils JC we added this to the JavaDoc:&lt;/p&gt;

&lt;blockquote&gt;&lt;p&gt;Enqueued jobs are stored in unbounded queues until they are run, this should be kept in mind as it might lead to an OOM.&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;and now that ^^^ is exactly what happened here... it would probably be better if we made the JobCoordinator reject jobs after a certain (configurable) capacity? And start dumping whatever is stuck in the queue at that point?&lt;/p&gt;</comment>
                            <comment id="59915" author="faseela.k@ericsson.com" created="Sat, 4 Nov 2017 02:02:46 +0000"  >&lt;p&gt;Yeah..this is what even I was proposing that day. &lt;br/&gt;
In one of our tests, we saw that two Jobs were in deadlock, and enough of such jobs were queued up to take up all available threads, and none of the new jobs had resources to get executed. &lt;br/&gt;
Taking a jstack output at that time helped us understand the culprit.&lt;/p&gt;</comment>
                            <comment id="59917" author="vorburger" created="Sat, 4 Nov 2017 02:20:03 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.opendaylight.org/browse/INFRAUTILS-24&quot; title=&quot;JobCoordinator should use bounded Executors and bound its own job queue&quot; class=&quot;issue-link&quot; data-issue-key=&quot;INFRAUTILS-24&quot;&gt;&lt;del&gt;INFRAUTILS-24&lt;/del&gt;&lt;/a&gt; will make the JobCoordinator reject jobs to avoid such OOMs in the future. We need to fix the bug hit during testing in this JIRA issue; I&apos;ll get jstack.&lt;/p&gt;</comment>
                            <comment id="59920" author="vorburger" created="Sat, 4 Nov 2017 02:58:55 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.opendaylight.org/secure/ViewProfile.jspa?name=k.faseela&quot; class=&quot;user-hover&quot; rel=&quot;k.faseela&quot;&gt;k.faseela&lt;/a&gt; said on IRC that earlier patch sets of &lt;a href=&quot;https://git.opendaylight.org/gerrit/#/c/63884/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/#/c/63884/&lt;/a&gt; caused this kind of problem, but that the final one (which also went into nitrogen) &quot;should&quot; have fixed the deadlock. So when we get the jstack, we should watch out whether it looks like it could have anything to do with that change, just to be sure. (She also mentioned that there will be a follow up patch which will fix something re. a &quot;slowing down of the DJC&quot;, but that&apos;s not related to deadlock / OOM, AFAIK.)&lt;/p&gt;</comment>
                            <comment id="59926" author="faseela.k@ericsson.com" created="Sun, 5 Nov 2017 18:04:09 +0000"  >&lt;p&gt;&lt;a href=&quot;https://git.opendaylight.org/gerrit/65146&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/65146&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;This will have some impact?&lt;/p&gt;</comment>
                            <comment id="59930" author="faseela.k@ericsson.com" created="Mon, 6 Nov 2017 11:07:02 +0000"  >&lt;p&gt;Kency indicated that there were some lockmanager related issues which used to make some jobs stuck in DJC, which is fixed under below review :&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://git.opendaylight.org/gerrit/#/c/61977/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://git.opendaylight.org/gerrit/#/c/61977/&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Could you please review and merge?&lt;/p&gt;</comment>
                            <comment id="59944" author="klou" created="Mon, 6 Nov 2017 20:46:45 +0000"  >&lt;p&gt;Is this issue related to &lt;a href=&quot;https://jira.opendaylight.org/browse/NETVIRT-974&quot; class=&quot;external-link&quot; rel=&quot;nofollow&quot;&gt;https://jira.opendaylight.org/browse/NETVIRT-974&lt;/a&gt; ?&lt;/p&gt;

&lt;p&gt;Is this truly a blocker for Nitrogen-SR1?  Thanks!&lt;/p&gt;</comment>
                            <comment id="59950" author="vorburger" created="Mon, 6 Nov 2017 22:18:06 +0000"  >&lt;p&gt;&amp;gt; Is this issue related to &lt;a href=&quot;https://jira.opendaylight.org/browse/NETVIRT-974&quot; class=&quot;external-link&quot; rel=&quot;nofollow&quot;&gt;https://jira.opendaylight.org/browse/NETVIRT-974&lt;/a&gt; ?&lt;/p&gt;

&lt;p&gt;no, not at all. But it could turn out to have one and the same single cause  as &lt;a href=&quot;https://jira.opendaylight.org/browse/GENIUS-97&quot; title=&quot;IdPoolListener OOM&quot; class=&quot;issue-link&quot; data-issue-key=&quot;GENIUS-97&quot;&gt;&lt;del&gt;GENIUS-97&lt;/del&gt;&lt;/a&gt; though - we don&apos;t know yet.&lt;/p&gt;

&lt;p&gt;&amp;gt; Is this truly a blocker for Nitrogen-SR1? Thanks!&lt;/p&gt;

&lt;p&gt;Yup.&lt;/p&gt;</comment>
                            <comment id="59970" author="vorburger" created="Tue, 7 Nov 2017 15:17:42 +0000"  >&lt;p&gt;Stack trace just attached to &lt;a href=&quot;https://jira.opendaylight.org/browse/GENIUS-97&quot; title=&quot;IdPoolListener OOM&quot; class=&quot;issue-link&quot; data-issue-key=&quot;GENIUS-97&quot;&gt;&lt;del&gt;GENIUS-97&lt;/del&gt;&lt;/a&gt; shows a lot of DataStoreJobCoordinator ...&lt;/p&gt;</comment>
                            <comment id="59977" author="vorburger" created="Tue, 7 Nov 2017 17:01:58 +0000"  >&lt;p&gt;This can only be reproduced with latest stable/Nitrogen HEAD (which will be SR1), NOT with the first September 26 Nitro, so recently broke.&lt;/p&gt;</comment>
                            <comment id="59986" author="klou" created="Tue, 7 Nov 2017 22:40:57 +0000"  >&lt;p&gt;Do we have ETA on resolution?  Need input to assess how far we have to push out Nitrogen-SR1.  Thanks!&lt;/p&gt;</comment>
                            <comment id="59992" author="vorburger" created="Wed, 8 Nov 2017 02:02:55 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.opendaylight.org/secure/ViewProfile.jspa?name=klou&quot; class=&quot;user-hover&quot; rel=&quot;klou&quot;&gt;klou&lt;/a&gt; ETA is when it&apos;s Fixed. We can try to do earlier than when it&apos;s Done, but we would need a time machine.&lt;/p&gt;</comment>
                            <comment id="59999" author="vorburger" created="Wed, 8 Nov 2017 20:31:53 +0000"  >&lt;p&gt;Closing as CANNOT REPRO, because &lt;a href=&quot;https://jira.opendaylight.org/secure/ViewProfile.jspa?name=ltomasbo&quot; class=&quot;user-hover&quot; rel=&quot;ltomasbo&quot;&gt;ltomasbo&lt;/a&gt;  has clarified that he only hits an OOM (reproducible) on Nitrogen 0.7.0 and 0.7.1 (=SP1) with Xmx 512 MB heap, instead of the default 2 GB, using which it works for him. The 512 MB  is the default when deploying ODL with devstack without specifying a different Xmx. We&apos;re proposing to fix that in &lt;a href=&quot;https://review.openstack.org/#/c/518540/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.openstack.org/#/c/518540/&lt;/a&gt; to avoid future confusion.&lt;/p&gt;</comment>
                            <comment id="60001" author="vorburger" created="Wed, 8 Nov 2017 20:46:55 +0000"  >&lt;p&gt;PS: We&apos;ll be adding proper JobCoordinator monitor-ability via &lt;a href=&quot;https://jira.opendaylight.org/browse/INFRAUTILS-19&quot; title=&quot;Coda Hale Dropwizard Metrics integration&quot; class=&quot;issue-link&quot; data-issue-key=&quot;INFRAUTILS-19&quot;&gt;&lt;del&gt;INFRAUTILS-19&lt;/del&gt;&lt;/a&gt;.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10000">
                    <name>Blocks</name>
                                                                <inwardlinks description="is blocked by">
                                        <issuelink>
            <issuekey id="28698">INFRAUTILS-24</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10003">
                    <name>Relates</name>
                                            <outwardlinks description="relates to">
                                        <issuelink>
            <issuekey id="28687">INFRAUTILS-19</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="14213" name="java_pid22161_Leak_Suspects.zip" size="131361" author="vorburger" created="Fri, 3 Nov 2017 21:52:00 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                            <customfield id="customfield_11400" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                    <customfield id="customfield_10202" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Priority</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10313"><![CDATA[Highest]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10000" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>0|i0378v:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                </customfields>
    </item>
</channel>
</rss>