<!-- 
RSS generated by JIRA (9.7.1#970001-sha1:2222b88b221c4928ef0de3161136cc90c8356a66) at Thu Feb 08 03:17:10 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>MongoDB Jira</title>
    <link>https://jira.mongodb.org</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.7.1</version>
        <build-number>970001</build-number>
        <build-date>13-04-2023</build-date>
    </build-info>


<item>
            <title>[SERVER-8341] Stemming and stop word deletion in phrases</title>
                <link>https://jira.mongodb.org/browse/SERVER-8341</link>
                <project id="10000" key="SERVER">Core Server</project>
                    <description>&lt;p&gt;Having indexed the Enron email dataset, with a two-field text index with default weightings, I&apos;m seeing unexpected behaviour when searching for phrases. It appears terms are being stemmed and stop words removed within a phrase:&lt;/p&gt;

&lt;p&gt;&amp;gt; db.getCollection(&quot;emails&quot;).runCommand(&quot;text&quot;, &lt;/p&gt;
{ &quot;search&quot; : &quot;\&quot;the scrimmage\&quot;&quot;,limit:1 }
&lt;p&gt;);&lt;/p&gt;

&lt;p&gt;&quot;queryDebugString&quot; : &quot;scrimmag||||the scrimmage||&quot;	&lt;/p&gt;

&lt;p&gt;&amp;gt; db.getCollection(&quot;emails&quot;).runCommand(&quot;text&quot;, &lt;/p&gt;
{ &quot;search&quot; : &apos;&quot;the scrimmage&quot;&apos;, limit:1 }
&lt;p&gt;);&lt;/p&gt;

&lt;p&gt;&quot;queryDebugString&quot; : &quot;scrimmag||||the scrimmage||&quot;&lt;/p&gt;

&lt;p&gt;This behaviour was first spotted by a MongoDB user at the FTS Hackathon in London.&lt;/p&gt;</description>
                <environment>Mac OS 10.7.5.&lt;br/&gt;
MongoDB 2.3.2</environment>
        <key id="63303">SERVER-8341</key>
            <summary>Stemming and stop word deletion in phrases</summary>
                <type id="1" iconUrl="https://jira.mongodb.org/secure/viewavatar?size=xsmall&amp;avatarId=14703&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.mongodb.org/images/icons/priorities/critical.svg">Critical - P2</priority>
                        <status id="6" iconUrl="https://jira.mongodb.org/images/icons/statuses/closed.png" description="The issue is considered finished, the resolution is correct. Issues which are closed can be reopened.">Closed</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="9">Done</resolution>
                                        <assignee username="-1">Unassigned</assignee>
                                    <reporter username="matt.bates@10gen.com">Matt Bates</reporter>
                        <labels>
                    </labels>
                <created>Fri, 25 Jan 2013 18:31:32 +0000</created>
                <updated>Tue, 19 Mar 2013 17:02:20 +0000</updated>
                            <resolved>Fri, 1 Feb 2013 18:21:43 +0000</resolved>
                                    <version>2.3.2</version>
                                                    <component>Text Search</component>
                                        <votes>0</votes>
                                    <watches>3</watches>
                                                                                                                <comments>
                            <comment id="253252" author="rassi@10gen.com" created="Tue, 29 Jan 2013 22:40:33 +0000"  >&lt;p&gt;&amp;gt; How would it be possible to search exactly for a phrase - without stop word removal and stemming?&lt;/p&gt;

&lt;p&gt;The phrase search you pasted above will do exactly this.&lt;/p&gt;

&lt;p&gt;Search queries are reduced to a list of stemmed terms, which are used to query into the index.  This list includes words from phrases and also words not inside phrases.  Stopwords are not included.  For your example, this list will be the singleton &lt;tt&gt;(scrimmag)&lt;/tt&gt;. After the results come back from the index, the matcher is invoked to filter out documents that do not include the specified phrases.&lt;/p&gt;

&lt;p&gt;I&apos;ll mark this ticket for review by the docs team.&lt;/p&gt;</comment>
                            <comment id="251792" author="matt.bates@10gen.com" created="Mon, 28 Jan 2013 15:41:37 +0000"  >&lt;p&gt;I read the release notes for 2.4 (2.3.2) and it states that it does not stem phrases or negations. Maybe the documentation is wrong and needs correcting?&lt;/p&gt;

&lt;p&gt;How would it be possible to search exactly for a phrase - without stop word removal and stemming? That&apos;s what was desired in the queries above (&apos;the scrimmage&apos;) and was asked/expected at the hackathon.&lt;/p&gt;
</comment>
                            <comment id="249827" author="eliot" created="Fri, 25 Jan 2013 18:36:09 +0000"  >&lt;p&gt;That is as designed.&lt;br/&gt;
Are you seeing results that are incorrect?&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                <customfield id="customfield_10050" key="com.atlassian.jira.toolkit:comments">
                        <customfieldname># Replies</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>3.0</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                <customfield id="customfield_10055" key="com.atlassian.jira.ext.charting:firstresponsedate">
                        <customfieldname>Date of 1st Reply</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Fri, 25 Jan 2013 18:36:09 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10052" key="com.atlassian.jira.toolkit:dayslastcommented">
                        <customfieldname>Days since reply</customfieldname>
                        <customfieldvalues>
                                        11 years, 3 weeks, 1 day ago
    
                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_18254" key="com.onresolve.jira.groovy.groovyrunner:scripted-field">
                        <customfieldname>Dependencies</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue><![CDATA[]]></customfieldvalue>


                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_15850" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                    <customfield id="customfield_10057" key="com.atlassian.jira.toolkit:lastusercommented">
                        <customfieldname>Last comment by Customer</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>true</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10056" key="com.atlassian.jira.toolkit:lastupdaterorcommenter">
                        <customfieldname>Last commenter</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>ian@mongodb.com</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_11151" key="com.atlassian.jira.toolkit:LastCommentDate">
                        <customfieldname>Last public comment date</customfieldname>
                        <customfieldvalues>
                            11 years, 3 weeks, 1 day ago
                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10000" key="com.atlassian.jira.plugin.system.customfieldtypes:radiobuttons">
                        <customfieldname>Old_Backport</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10000"><![CDATA[No]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10032" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Operating System</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10026"><![CDATA[ALL]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                <customfield id="customfield_10051" key="com.atlassian.jira.toolkit:participants">
                        <customfieldname>Participants</customfieldname>
                        <customfieldvalues>
                                        <customfieldvalue>eliot</customfieldvalue>
            <customfieldvalue>rassi</customfieldvalue>
            <customfieldvalue>matt.bates@10gen.com</customfieldvalue>
    
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                        <customfield id="customfield_14254" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Product Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hrn9jz:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                <customfield id="customfield_12550" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>2|hrltpr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10558" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>40873</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_23361" key="com.onresolve.jira.groovy.groovyrunner:scripted-field">
                        <customfieldname>Requested By</customfieldname>
                        <customfieldvalues>
                                

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_10053" key="com.atlassian.jira.ext.charting:timeinstatus">
                        <customfieldname>Time In Status</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_22870" key="com.onresolve.jira.groovy.groovyrunner:scripted-field">
                        <customfieldname>Triagers</customfieldname>
                        <customfieldvalues>
                                

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                    <customfield id="customfield_14350" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>serverRank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|ht05dr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                    </customfields>
    </item>
</channel>
</rss>