<!-- 
RSS generated by JIRA (9.7.1#970001-sha1:2222b88b221c4928ef0de3161136cc90c8356a66) at Thu Feb 08 02:54:51 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>MongoDB Jira</title>
    <link>https://jira.mongodb.org</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.7.1</version>
        <build-number>970001</build-number>
        <build-date>13-04-2023</build-date>
    </build-info>


<item>
            <title>[SERVER-676] use multiple cores for index sort-phase</title>
                <link>https://jira.mongodb.org/browse/SERVER-676</link>
                <project id="10000" key="SERVER">Core Server</project>
                    <description>&lt;p&gt;It would be nice if the external sort for creating an index used multiple cores. &lt;/p&gt;</description>
                <environment></environment>
        <key id="11377">SERVER-676</key>
            <summary>use multiple cores for index sort-phase</summary>
                <type id="4" iconUrl="https://jira.mongodb.org/secure/viewavatar?size=xsmall&amp;avatarId=14710&amp;avatarType=issuetype">Improvement</type>
                                            <priority id="4" iconUrl="https://jira.mongodb.org/images/icons/priorities/minor.svg">Minor - P4</priority>
                        <status id="6" iconUrl="https://jira.mongodb.org/images/icons/statuses/closed.png" description="The issue is considered finished, the resolution is correct. Issues which are closed can be reopened.">Closed</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="12300">Won&apos;t Do</resolution>
                                        <assignee username="backlog-server-execution">Backlog - Storage Execution Team</assignee>
                                    <reporter username="dwight@mongodb.com">Dwight Merriman</reporter>
                        <labels>
                    </labels>
                <created>Thu, 25 Feb 2010 09:29:47 +0000</created>
                <updated>Thu, 7 Dec 2023 09:45:49 +0000</updated>
                            <resolved>Mon, 20 Nov 2023 19:37:37 +0000</resolved>
                                                                    <component>Index Maintenance</component>
                                        <votes>41</votes>
                                    <watches>62</watches>
                                                                                                                <comments>
                            <comment id="5932110" author="bigbourin@gmail.com" created="Thu, 7 Dec 2023 09:45:49 +0000"  >&lt;p&gt;Thanks!&lt;/p&gt;</comment>
                            <comment id="5931322" author="steven.vannelli" created="Wed, 6 Dec 2023 22:46:30 +0000"  >&lt;p&gt;Hi &lt;a href=&quot;https://jira.mongodb.org/secure/ViewProfile.jspa?name=bigbourin%40gmail.com&quot; class=&quot;user-hover&quot; rel=&quot;bigbourin@gmail.com&quot;&gt;bigbourin@gmail.com&lt;/a&gt;, you can follow&#160;&lt;a href=&quot;https://jira.mongodb.org/browse/SERVER-83953&quot; title=&quot;Use parallelism to speed up index builds&quot; class=&quot;issue-link&quot; data-issue-key=&quot;SERVER-83953&quot;&gt;SERVER-83953&lt;/a&gt;. Once the work is done, the team will update that ticket. &#160;&lt;/p&gt;</comment>
                            <comment id="5893932" author="bigbourin@gmail.com" created="Mon, 20 Nov 2023 22:55:33 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.mongodb.org/secure/ViewProfile.jspa?name=steven.vannelli%40mongodb.com&quot; class=&quot;user-hover&quot; rel=&quot;steven.vannelli@mongodb.com&quot;&gt;steven.vannelli@mongodb.com&lt;/a&gt; thanks for the update, is there any ticket where we can follow this index build parallelism feature?&lt;/p&gt;</comment>
                            <comment id="5893326" author="steven.vannelli" created="Mon, 20 Nov 2023 19:37:37 +0000"  >&lt;p&gt;We found some small improvements for index builds but our future plans for index builds use parallelism for the entire process and not just for the sorting phase. &lt;/p&gt;
</comment>
                            <comment id="5776495" author="JIRAUSER1264163" created="Fri, 13 Oct 2023 14:20:02 +0000"  >&lt;p&gt;Putting this back in the backlog as we identified a few ways of improving the throughput of index builds:&lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;&lt;a href=&quot;https://jira.mongodb.org/browse/SERVER-81568&quot; title=&quot;Batch Bulk inserts during the indexing collection scan&quot; class=&quot;issue-link&quot; data-issue-key=&quot;SERVER-81568&quot;&gt;SERVER-81568&lt;/a&gt;&lt;/li&gt;
	&lt;li&gt;&lt;a href=&quot;https://jira.mongodb.org/browse/SERVER-81571&quot; title=&quot;Reconsider stable sort in sorter.cpp&quot; class=&quot;issue-link&quot; data-issue-key=&quot;SERVER-81571&quot;&gt;SERVER-81571&lt;/a&gt;&lt;/li&gt;
&lt;/ul&gt;


&lt;p&gt;Both of these tickets combined yielded significant improvements without resorting to complete refactors of the index build architecture.&lt;/p&gt;</comment>
                            <comment id="4054572" author="connie.chen" created="Mon, 13 Sep 2021 18:47:55 +0000"  >&lt;p&gt;We can consider this during initial sync, repair, or any other operation that is known to be single-threaded.&#160;&lt;/p&gt;</comment>
                            <comment id="3268132" author="corporate.piyush@gmail.com" created="Thu, 2 Jul 2020 11:47:38 +0000"  >&lt;p&gt;This issue needs reconsideration. In addition, it would be helpful if re-building it did not acquire a lock on the collection.&lt;/p&gt;</comment>
                            <comment id="2196819" author="oleg_gritsak" created="Sat, 30 Mar 2019 11:42:26 +0000"  >&lt;p&gt;So sad to see this feature request in low priority queue for almost a decade.&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;Speed is the key feature of Mongo for me, and now it is even more important to match competitors. PostgreSQL recently implemented MT-indexing. Oracle has been able to do it for years.&lt;/p&gt;

&lt;p&gt;I had a task to import 20 billion (20,000 million) short documents into Mongo, and it failed miserably. Batch insert speed is impressive - more than a million inserts/sec. But creation of an index on a 2TB collection is going to last forever...&lt;/p&gt;</comment>
                            <comment id="1427803" author="royrez@microsoft.com" created="Mon, 7 Nov 2016 14:02:41 +0000"  >&lt;p&gt;Thanks Eric,&lt;br/&gt;
It might be useful for some use cases; however, it sounds to me like sorting the keys during the data copy phase does not change the fact that it will be CPU bound in that phase instead of the index build phase.&lt;br/&gt;
If the issue I was referring to was being IO bound, I can understand how passing through the data only once improves that.&lt;br/&gt;
Regarding the multiple collections, that makes sense, but I still think that for many use-cases like a small # of large collections - it still won&apos;t be good enough.&lt;/p&gt;</comment>
                            <comment id="1427773" author="milkie" created="Mon, 7 Nov 2016 13:24:57 +0000"  >&lt;p&gt;Roy, I believe that other initial sync improvements will have a bigger impact.  Some of these improvements are already implemented for the 3.4 release &amp;#8211; we now sort all the index keys for a collection during the data copy phase, for example, which avoids multiple passes through the data.  Eventually, I would like to see multiple collections cloning simultaneously, which would permit multiple index builds running on multiple cores.&lt;/p&gt;</comment>
                            <comment id="1427251" author="royrez@microsoft.com" created="Sun, 6 Nov 2016 10:01:00 +0000"  >&lt;p&gt;Not sure why this issue is marked as &quot;minor&quot; - it has a huge impact when doing initial sync, which is very slow and single CPU bound in the index build phase...&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Depends</name>
                                            <outwardlinks description="depends on">
                                                        </outwardlinks>
                                                        </issuelinktype>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                                                <inwardlinks description="is duplicated by">
                                        <issuelink>
            <issuekey id="139943">SERVER-14154</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10012">
                    <name>Related</name>
                                            <outwardlinks description="related to">
                                        <issuelink>
            <issuekey id="2454703">SERVER-81568</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="2518447">SERVER-83953</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="2454739">SERVER-81571</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="224154">SERVER-19766</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                <customfield id="customfield_10050" key="com.atlassian.jira.toolkit:comments">
                        <customfieldname># Replies</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>11.0</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_18555" key="com.onresolve.jira.groovy.groovyrunner:scripted-field">
                        <customfieldname># of Sprints</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1.0</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                    <customfield id="customfield_12751" key="com.atlassian.jira.plugin.system.customfieldtypes:multiselect">
                        <customfieldname>Assigned Teams</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="25136"><![CDATA[Storage Execution]]></customfieldvalue>
    
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_13552" key="com.go2group.jira.plugin.crm:crm_generic_field">
                        <customfieldname>Case</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue><![CDATA[[500A000000cCoCyIAK, 5002K00000fGPYNQA4, 5002K00000mqyAZQAY, 5002K00000noiYyQAI, 5002K00000nq6GOQAY, 5002K00000s1IQqQAM, 5002K00000tTv8ZQAS, 5006R00001veG30QAE]]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_10055" key="com.atlassian.jira.ext.charting:firstresponsedate">
                        <customfieldname>Date of 1st Reply</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Sun, 6 Nov 2016 10:01:00 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10052" key="com.atlassian.jira.toolkit:dayslastcommented">
                        <customfieldname>Days since reply</customfieldname>
                        <customfieldvalues>
                                        8 weeks, 6 days ago
    
                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_18254" key="com.onresolve.jira.groovy.groovyrunner:scripted-field">
                        <customfieldname>Dependencies</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue><![CDATA[<s><a href='https://jira.mongodb.org/browse/PM-1723'>PM-1723</a></s>]]></customfieldvalue>


                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_15850" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10057" key="com.atlassian.jira.toolkit:lastusercommented">
                        <customfieldname>Last comment by Customer</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>true</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10056" key="com.atlassian.jira.toolkit:lastupdaterorcommenter">
                        <customfieldname>Last commenter</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>bigbourin@gmail.com</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_11151" key="com.atlassian.jira.toolkit:LastCommentDate">
                        <customfieldname>Last public comment date</customfieldname>
                        <customfieldvalues>
                            8 weeks, 6 days ago
                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10000" key="com.atlassian.jira.plugin.system.customfieldtypes:radiobuttons">
                        <customfieldname>Old_Backport</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10000"><![CDATA[No]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                <customfield id="customfield_10051" key="com.atlassian.jira.toolkit:participants">
                        <customfieldname>Participants</customfieldname>
                        <customfieldvalues>
                                        <customfieldvalue>bigbourin@gmail.com</customfieldvalue>
            <customfieldvalue>backlog-server-execution</customfieldvalue>
            <customfieldvalue>connie.chen@mongodb.com</customfieldvalue>
            <customfieldvalue>dwight@mongodb.com</customfieldvalue>
            <customfieldvalue>milkie@mongodb.com</customfieldvalue>
            <customfieldvalue>jordi.olivares-provencio@mongodb.com</customfieldvalue>
            <customfieldvalue>oleg_gritsak</customfieldvalue>
            <customfieldvalue>corporate.piyush@gmail.com</customfieldvalue>
            <customfieldvalue>royrez@microsoft.com</customfieldvalue>
            <customfieldvalue>steven.vannelli@mongodb.com</customfieldvalue>
    
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                        <customfield id="customfield_14254" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Product Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hrprfj:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                <customfield id="customfield_12550" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>2|i0i5nn:i</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10558" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>4263</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                <customfield id="customfield_10557" key="com.pyxis.greenhopper.jira:gh-sprint">
                        <customfieldname>Sprint</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue id="7685">Execution EMEA Team 2023-10-02</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_10053" key="com.atlassian.jira.ext.charting:timeinstatus">
                        <customfieldname>Time In Status</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_22870" key="com.onresolve.jira.groovy.groovyrunner:scripted-field">
                        <customfieldname>Triagers</customfieldname>
                        <customfieldvalues>
                                

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                    <customfield id="customfield_14350" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>serverRank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|ht0ttr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                    </customfields>
    </item>
</channel>
</rss>