<!-- 
RSS generated by JIRA (9.7.1#970001-sha1:2222b88b221c4928ef0de3161136cc90c8356a66) at Thu Feb 08 03:14:48 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>MongoDB Jira</title>
    <link>https://jira.mongodb.org</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.7.1</version>
        <build-number>970001</build-number>
        <build-date>13-04-2023</build-date>
    </build-info>


<item>
            <title>[SERVER-7529] collection grows unexpectedly large</title>
                <link>https://jira.mongodb.org/browse/SERVER-7529</link>
                <project id="10000" key="SERVER">Core Server</project>
                    <description>&lt;p&gt;We use mongo 2.2.0, replica set of 3 instances, no sharding.&lt;br/&gt;
Storage that has grown to 44 times the data size definitely looks like a bug, not a feature.&lt;br/&gt;
Collection is used as a fast cache, so it is write/remove intensive.&lt;br/&gt;
After we experienced this problem, we started to use power of 2 sizes. But it didn&apos;t help.&lt;/p&gt;

&lt;p&gt;db.stats(1024*1024*1024);&lt;br/&gt;
{&lt;br/&gt;
	&quot;db&quot; : &quot;image-url&quot;,&lt;br/&gt;
	&quot;collections&quot; : 10,&lt;br/&gt;
	&quot;objects&quot; : 3324847,&lt;br/&gt;
	&quot;avgObjSize&quot; : 401.2754499680737,&lt;br/&gt;
	&quot;dataSize&quot; : 1,&lt;br/&gt;
	&quot;storageSize&quot; : 44,&lt;br/&gt;
	&quot;numExtents&quot; : 64,&lt;br/&gt;
	&quot;indexes&quot; : 12,&lt;br/&gt;
	&quot;indexSize&quot; : 0,&lt;br/&gt;
	&quot;fileSize&quot; : 51,&lt;br/&gt;
	&quot;nsSizeMB&quot; : 16,&lt;br/&gt;
	&quot;ok&quot; : 1&lt;br/&gt;
}&lt;/p&gt;</description>
                <environment></environment>
        <key id="54990">SERVER-7529</key>
            <summary>collection grows unexpectedly large</summary>
                <type id="1" iconUrl="https://jira.mongodb.org/secure/viewavatar?size=xsmall&amp;avatarId=14703&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.mongodb.org/images/icons/priorities/major.svg">Major - P3</priority>
                        <status id="6" iconUrl="https://jira.mongodb.org/images/icons/statuses/closed.png" description="The issue is considered finished, the resolution is correct. Issues which are closed can be reopened.">Closed</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="9">Done</resolution>
                                        <assignee username="milkie@mongodb.com">Eric Milkie</assignee>
                                    <reporter username="gabol">Anton V. Volokhov</reporter>
                        <labels>
                    </labels>
                <created>Thu, 1 Nov 2012 12:49:39 +0000</created>
                <updated>Fri, 15 Feb 2013 15:06:50 +0000</updated>
                            <resolved>Fri, 9 Nov 2012 15:01:28 +0000</resolved>
                                                                                        <votes>1</votes>
                                    <watches>6</watches>
                                                                                                                <comments>
                            <comment id="183038" author="milkie" created="Tue, 6 Nov 2012 16:21:08 +0000"  >&lt;p&gt;The current MongoDB storage engine design does not handle certain workloads very efficiently with respect to fragmentation.  With PowerOf2Sizes, some of the fragmentation issues are ameliorated.  So for your collection image-url.pictures, I think you&apos;ll see much slower growth, if any, if you turn on that feature.  &lt;/p&gt;</comment>
                            <comment id="183029" author="gabol" created="Tue, 6 Nov 2012 16:13:12 +0000"  >&lt;p&gt;I didn&apos;t set usePowerOf2Sizes flag.&lt;br/&gt;
The issue is that the collection image-url.pictures repeatedly grows to 40-50GB, with an actual &quot;size&quot; of only 1-2GB, every 2-3 months.&lt;br/&gt;
PowerOf2Sizes was not used, I apologize for the confusion.&lt;/p&gt;</comment>
                            <comment id="182988" author="milkie" created="Tue, 6 Nov 2012 14:45:21 +0000"  >&lt;p&gt;Hi Anton.&lt;br/&gt;
I&apos;m still not sure where you&apos;ve set the usePowerOf2Sizes flag.  Your last comment shows userFlags is 0 for image-url.pictures.&lt;/p&gt;</comment>
                            <comment id="182955" author="gabol" created="Tue, 6 Nov 2012 13:01:52 +0000"  >&lt;p&gt;Oops. Sorry, I set it in the dev instance. But still, the collection keeps growing:&lt;br/&gt;
{&lt;br/&gt;
	&quot;sharded&quot; : false,&lt;br/&gt;
	&quot;primary&quot; : &quot;mongodb-sh2&quot;,&lt;br/&gt;
	&quot;ns&quot; : &quot;image-url.pictures&quot;,&lt;br/&gt;
	&quot;count&quot; : 3134045,&lt;br/&gt;
	&quot;size&quot; : 1257568172,&lt;br/&gt;
	&quot;avgObjSize&quot; : 401.2604069182159,&lt;br/&gt;
	&quot;storageSize&quot; : 52233957040,&lt;br/&gt;
	&quot;numExtents&quot; : 45,&lt;br/&gt;
	&quot;nindexes&quot; : 2,&lt;br/&gt;
	&quot;lastExtentSize&quot; : 2146426864,&lt;br/&gt;
	&quot;paddingFactor&quot; : 1,&lt;br/&gt;
	&quot;systemFlags&quot; : 1,&lt;br/&gt;
	&quot;userFlags&quot; : 0,&lt;br/&gt;
	&quot;totalIndexSize&quot; : 253619520,&lt;br/&gt;
	&quot;indexSizes&quot; : {&lt;br/&gt;
		&quot;_id_&quot; : 121479008,&lt;br/&gt;
		&quot;_h_1&quot; : 132140512&lt;br/&gt;
	},&lt;br/&gt;
	&quot;ok&quot; : 1&lt;br/&gt;
}&lt;br/&gt;
it gained two more GBs in four days.&lt;/p&gt;</comment>
                            <comment id="182060" author="milkie" created="Fri, 2 Nov 2012 19:34:49 +0000"  >&lt;p&gt;For usePowerOf2Sizes to be active on a collection, the &quot;userFlags&quot; field should be at least 1.  Can you confirm you set the flag correctly?&lt;/p&gt;</comment>
                            <comment id="182045" author="gabol" created="Fri, 2 Nov 2012 19:01:59 +0000"  >&lt;p&gt;I have one worker collection (pictures) and a bunch of tiny helper collections:&lt;br/&gt;
{&lt;br/&gt;
	&quot;sharded&quot; : false,&lt;br/&gt;
	&quot;primary&quot; : &quot;mongodb-sh2&quot;,&lt;br/&gt;
	&quot;ns&quot; : &quot;image-url.pictures&quot;,&lt;br/&gt;
	&quot;count&quot; : 3268394,&lt;br/&gt;
	&quot;size&quot; : 1310752036,&lt;br/&gt;
	&quot;avgObjSize&quot; : 401.0385638940715,&lt;br/&gt;
	&quot;storageSize&quot; : 50087530176,&lt;br/&gt;
	&quot;numExtents&quot; : 44,&lt;br/&gt;
	&quot;nindexes&quot; : 2,&lt;br/&gt;
	&quot;lastExtentSize&quot; : 2146426864,&lt;br/&gt;
	&quot;paddingFactor&quot; : 1,&lt;br/&gt;
	&quot;systemFlags&quot; : 1,&lt;br/&gt;
	&quot;userFlags&quot; : 0,&lt;br/&gt;
	&quot;totalIndexSize&quot; : 244037248,&lt;br/&gt;
	&quot;indexSizes&quot; : {&lt;br/&gt;
		&quot;_id_&quot; : 122460128,&lt;br/&gt;
		&quot;_h_1&quot; : 121577120&lt;br/&gt;
	},&lt;br/&gt;
	&quot;ok&quot; : 1&lt;br/&gt;
}&lt;/p&gt;

&lt;p&gt;{&lt;br/&gt;
	&quot;sharded&quot; : false,&lt;br/&gt;
	&quot;primary&quot; : &quot;mongodb-sh2&quot;,&lt;br/&gt;
	&quot;ns&quot; : &quot;image-url.clusterizer&quot;,&lt;br/&gt;
	&quot;count&quot; : 2048,&lt;br/&gt;
	&quot;size&quot; : 53240,&lt;br/&gt;
	&quot;avgObjSize&quot; : 25.99609375,&lt;br/&gt;
	&quot;storageSize&quot; : 348160,&lt;br/&gt;
	&quot;numExtents&quot; : 4,&lt;br/&gt;
	&quot;nindexes&quot; : 1,&lt;br/&gt;
	&quot;lastExtentSize&quot; : 262144,&lt;br/&gt;
	&quot;paddingFactor&quot; : 1,&lt;br/&gt;
	&quot;systemFlags&quot; : 1,&lt;br/&gt;
	&quot;userFlags&quot; : 0,&lt;br/&gt;
	&quot;totalIndexSize&quot; : 73584,&lt;br/&gt;
	&quot;indexSizes&quot; : {&lt;br/&gt;
		&quot;_id_&quot; : 73584&lt;br/&gt;
	},&lt;br/&gt;
	&quot;ok&quot; : 1&lt;br/&gt;
}&lt;/p&gt;

&lt;p&gt;{&lt;br/&gt;
	&quot;sharded&quot; : false,&lt;br/&gt;
	&quot;primary&quot; : &quot;mongodb-sh2&quot;,&lt;br/&gt;
	&quot;ns&quot; : &quot;image-url.ext-data.chunks&quot;,&lt;br/&gt;
	&quot;count&quot; : 0,&lt;br/&gt;
	&quot;size&quot; : 0,&lt;br/&gt;
	&quot;storageSize&quot; : 8192,&lt;br/&gt;
	&quot;numExtents&quot; : 1,&lt;br/&gt;
	&quot;nindexes&quot; : 2,&lt;br/&gt;
	&quot;lastExtentSize&quot; : 8192,&lt;br/&gt;
	&quot;paddingFactor&quot; : 1,&lt;br/&gt;
	&quot;systemFlags&quot; : 1,&lt;br/&gt;
	&quot;userFlags&quot; : 0,&lt;br/&gt;
	&quot;totalIndexSize&quot; : 16352,&lt;br/&gt;
	&quot;indexSizes&quot; : {&lt;br/&gt;
		&quot;_id_&quot; : 8176,&lt;br/&gt;
		&quot;files_id_1_n_1&quot; : 8176&lt;br/&gt;
	},&lt;br/&gt;
	&quot;ok&quot; : 1&lt;br/&gt;
}&lt;br/&gt;
{&lt;br/&gt;
	&quot;sharded&quot; : false,&lt;br/&gt;
	&quot;primary&quot; : &quot;mongodb-sh2&quot;,&lt;br/&gt;
	&quot;ns&quot; : &quot;image-url.ext-data.files&quot;,&lt;br/&gt;
	&quot;count&quot; : 0,&lt;br/&gt;
	&quot;size&quot; : 0,&lt;br/&gt;
	&quot;storageSize&quot; : 8192,&lt;br/&gt;
	&quot;numExtents&quot; : 1,&lt;br/&gt;
	&quot;nindexes&quot; : 2,&lt;br/&gt;
	&quot;lastExtentSize&quot; : 8192,&lt;br/&gt;
	&quot;paddingFactor&quot; : 1,&lt;br/&gt;
	&quot;systemFlags&quot; : 1,&lt;br/&gt;
	&quot;userFlags&quot; : 0,&lt;br/&gt;
	&quot;totalIndexSize&quot; : 16352,&lt;br/&gt;
	&quot;indexSizes&quot; : {&lt;br/&gt;
		&quot;_id_&quot; : 8176,&lt;br/&gt;
		&quot;filename_1_uploadDate_1&quot; : 8176&lt;br/&gt;
	},&lt;br/&gt;
	&quot;ok&quot; : 1&lt;br/&gt;
}&lt;/p&gt;

&lt;p&gt;{&lt;br/&gt;
	&quot;sharded&quot; : false,&lt;br/&gt;
	&quot;primary&quot; : &quot;mongodb-sh2&quot;,&lt;br/&gt;
	&quot;ns&quot; : &quot;image-url.indexConverter&quot;,&lt;br/&gt;
	&quot;count&quot; : 2048,&lt;br/&gt;
	&quot;size&quot; : 53280,&lt;br/&gt;
	&quot;avgObjSize&quot; : 26.015625,&lt;br/&gt;
	&quot;storageSize&quot; : 348160,&lt;br/&gt;
	&quot;numExtents&quot; : 4,&lt;br/&gt;
	&quot;nindexes&quot; : 1,&lt;br/&gt;
	&quot;lastExtentSize&quot; : 262144,&lt;br/&gt;
	&quot;paddingFactor&quot; : 1,&lt;br/&gt;
	&quot;systemFlags&quot; : 1,&lt;br/&gt;
	&quot;userFlags&quot; : 0,&lt;br/&gt;
	&quot;totalIndexSize&quot; : 73584,&lt;br/&gt;
	&quot;indexSizes&quot; : {&lt;br/&gt;
		&quot;_id_&quot; : 73584&lt;br/&gt;
	},&lt;br/&gt;
	&quot;ok&quot; : 1&lt;br/&gt;
}&lt;/p&gt;

&lt;p&gt;{&lt;br/&gt;
	&quot;sharded&quot; : false,&lt;br/&gt;
	&quot;primary&quot; : &quot;mongodb-sh2&quot;,&lt;br/&gt;
	&quot;ns&quot; : &quot;image-url.partition&quot;,&lt;br/&gt;
	&quot;count&quot; : 2048,&lt;br/&gt;
	&quot;size&quot; : 53280,&lt;br/&gt;
	&quot;avgObjSize&quot; : 26.015625,&lt;br/&gt;
	&quot;storageSize&quot; : 348160,&lt;br/&gt;
	&quot;numExtents&quot; : 4,&lt;br/&gt;
	&quot;nindexes&quot; : 1,&lt;br/&gt;
	&quot;lastExtentSize&quot; : 262144,&lt;br/&gt;
	&quot;paddingFactor&quot; : 1,&lt;br/&gt;
	&quot;systemFlags&quot; : 1,&lt;br/&gt;
	&quot;userFlags&quot; : 0,&lt;br/&gt;
	&quot;totalIndexSize&quot; : 89936,&lt;br/&gt;
	&quot;indexSizes&quot; : {&lt;br/&gt;
		&quot;_id_&quot; : 89936&lt;br/&gt;
	},&lt;br/&gt;
	&quot;ok&quot; : 1&lt;br/&gt;
}&lt;br/&gt;
{&lt;br/&gt;
	&quot;sharded&quot; : false,&lt;br/&gt;
	&quot;primary&quot; : &quot;mongodb-sh2&quot;,&lt;br/&gt;
	&quot;ns&quot; : &quot;image-url.unifier&quot;,&lt;br/&gt;
	&quot;count&quot; : 2048,&lt;br/&gt;
	&quot;size&quot; : 53240,&lt;br/&gt;
	&quot;avgObjSize&quot; : 25.99609375,&lt;br/&gt;
	&quot;storageSize&quot; : 348160,&lt;br/&gt;
	&quot;numExtents&quot; : 4,&lt;br/&gt;
	&quot;nindexes&quot; : 1,&lt;br/&gt;
	&quot;lastExtentSize&quot; : 262144,&lt;br/&gt;
	&quot;paddingFactor&quot; : 1,&lt;br/&gt;
	&quot;systemFlags&quot; : 1,&lt;br/&gt;
	&quot;userFlags&quot; : 0,&lt;br/&gt;
	&quot;totalIndexSize&quot; : 73584,&lt;br/&gt;
	&quot;indexSizes&quot; : {&lt;br/&gt;
		&quot;_id_&quot; : 73584&lt;br/&gt;
	},&lt;br/&gt;
	&quot;ok&quot; : 1&lt;br/&gt;
}&lt;/p&gt;</comment>
                            <comment id="181969" author="milkie" created="Fri, 2 Nov 2012 16:58:00 +0000"  >&lt;p&gt;Hi Anton.&lt;br/&gt;
Can you attach the output from running stats() on each of your collections in the image-url database?&lt;/p&gt;</comment>
                            <comment id="181968" author="gabol" created="Fri, 2 Nov 2012 16:56:48 +0000"  >&lt;p&gt;So, repair worked as expected. The collection has been growing to this volume for a month or two.&lt;/p&gt;</comment>
                            <comment id="181805" author="gabol" created="Fri, 2 Nov 2012 10:08:42 +0000"  >&lt;p&gt;First, I ran a repair, then modified the collection.&lt;/p&gt;</comment>
                            <comment id="181475" author="eliot" created="Thu, 1 Nov 2012 16:36:51 +0000"  >&lt;p&gt;Did you start a new collection or run a repair after switching to power of 2 sizes?&lt;br/&gt;
Just switching won&apos;t fix the old fragmentation.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                <customfield id="customfield_10050" key="com.atlassian.jira.toolkit:comments">
                        <customfieldname># Replies</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>10.0</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                <customfield id="customfield_10055" key="com.atlassian.jira.ext.charting:firstresponsedate">
                        <customfieldname>Date of 1st Reply</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Thu, 1 Nov 2012 16:36:51 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10052" key="com.atlassian.jira.toolkit:dayslastcommented">
                        <customfieldname>Days since reply</customfieldname>
                        <customfieldvalues>
                                        11 years, 15 weeks, 1 day ago
    
                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_18254" key="com.onresolve.jira.groovy.groovyrunner:scripted-field">
                        <customfieldname>Dependencies</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue><![CDATA[]]></customfieldvalue>


                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_15850" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                    <customfield id="customfield_10057" key="com.atlassian.jira.toolkit:lastusercommented">
                        <customfieldname>Last comment by Customer</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>false</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10056" key="com.atlassian.jira.toolkit:lastupdaterorcommenter">
                        <customfieldname>Last commenter</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>ian@mongodb.com</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_11151" key="com.atlassian.jira.toolkit:LastCommentDate">
                        <customfieldname>Last public comment date</customfieldname>
                        <customfieldvalues>
                            11 years, 15 weeks, 1 day ago
                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10000" key="com.atlassian.jira.plugin.system.customfieldtypes:radiobuttons">
                        <customfieldname>Old_Backport</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10000"><![CDATA[No]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10032" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Operating System</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10026"><![CDATA[ALL]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                <customfield id="customfield_10051" key="com.atlassian.jira.toolkit:participants">
                        <customfieldname>Participants</customfieldname>
                        <customfieldvalues>
                                        <customfieldvalue>gabol</customfieldvalue>
            <customfieldvalue>eliot</customfieldvalue>
            <customfieldvalue>milkie@mongodb.com</customfieldvalue>
    
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                        <customfield id="customfield_14254" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Product Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hrnj9b:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                <customfield id="customfield_12550" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>2|hrkc0n:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10558" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>32372</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_23361" key="com.onresolve.jira.groovy.groovyrunner:scripted-field">
                        <customfieldname>Requested By</customfieldname>
                        <customfieldvalues>
                                

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_10053" key="com.atlassian.jira.ext.charting:timeinstatus">
                        <customfieldname>Time In Status</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_22870" key="com.onresolve.jira.groovy.groovyrunner:scripted-field">
                        <customfieldname>Triagers</customfieldname>
                        <customfieldvalues>
                                

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                    <customfield id="customfield_14350" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>serverRank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|ht069r:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                    </customfields>
    </item>
</channel>
</rss>