Loading...

XML

Word

Printable

JSON

Type: Bug
Resolution: Fixed
Priority: Major - P3
Fix Version/s: 8.1.0-rc0
Affects Version/s: 6.0.17, 5.0.29, 8.0.0-rc18, 7.0.14
Component/s: Distributed Query Planning, Sharding
Labels:
None

Assigned Teams:

Query Optimization
Backwards Compatibility:
Fully Compatible
Operating System:
ALL
Backport Requested:

v8.0, v7.0, v6.0, v5.0
Steps To Reproduce:
Hide

I ran the following in the no_passthrough suite.

import {configureFailPoint} from "jstests/libs/fail_point_util.js"; import {ShardingTest} from "jstests/libs/shardingtest.js"; const caseInsensitive = { locale: "en_US", strength: 2 }; // 2 shards. var st = new ShardingTest({shards: 2}); var testDB = st.s.getDB("test"); assert.commandWorked( testDB.adminCommand({enableSharding: testDB.getName(), primaryShard: st.shard0.shardName})); // Create a collection with a case-insensitive default collation sharded on {a: 1}. var collCaseInsensitive = testDB.getCollection("case_insensitive"); collCaseInsensitive.drop(); assert.commandWorked(testDB.createCollection("case_insensitive", {collation: caseInsensitive})); assert.commandWorked(collCaseInsensitive.createIndex({a: 1}, {collation: {locale: "simple"}})); assert.commandWorked(testDB.adminCommand({ shardCollection: collCaseInsensitive.getFullName(), key: {a: 1}, collation: {locale: "simple"} })); // Split the collection. // shard0: [chunk 1] { "a" : { "$minKey" : 1 } } -->> { "a" : 0 } // shard0: [chunk 2] { "a" : 0 } -->> { "a" : "b"} // shard1: [chunk 3] { "a" : "b" } -->> { "a" : { "$maxKey" : 1 }} // Note that we need two chunks on shard0 for this repro. My guess is that its because if we move // all the chunks from shard0 to shard1, we will somehow know to only target shard1 in the query // below. assert.commandWorked( testDB.adminCommand({split: collCaseInsensitive.getFullName(), middle: {a: 0}})); assert.commandWorked( testDB.adminCommand({split: collCaseInsensitive.getFullName(), middle: {a: "b"}})); assert.commandWorked(testDB.adminCommand( {moveChunk: collCaseInsensitive.getFullName(), find: {a: -1}, to: st.shard0.shardName})); assert.commandWorked(testDB.adminCommand( {moveChunk: collCaseInsensitive.getFullName(), find: {a: "a"}, to: st.shard0.shardName})); assert.commandWorked(testDB.adminCommand( {moveChunk: collCaseInsensitive.getFullName(), find: {a: "c"}, to: st.shard1.shardName})); // Put data on shard0, that will go into chunk 1. const doc = { _id: 0, a: "a" }; assert.commandWorked(collCaseInsensitive.insert(doc)); // Perform a chunk migration of chunk 1 from shard0 to shard1, but do not clean up orphans on // shard0. let suspendRangeDeletionShard0 = configureFailPoint(st.shard0, 'suspendRangeDeletion'); testDB.adminCommand( {moveChunk: collCaseInsensitive.getFullName(), find: {a: "a"}, to: st.shard1.shardName}); // Equality predicate. Since the query has non-simple collation we will have to broadcast to all // shards (since the shard key is on a simple collation index). However, we return the result doc // twice which means we do not properly do shard filtering in this case. const results = collCaseInsensitive.find({a: "a"}).collation(caseInsensitive).toArray(); print("results are ", tojson(results)); assert.eq(results, [doc, doc]); // BAD! DUPLICATE RESULT! suspendRangeDeletionShard0.off(); st.stop();
Show
I ran the following in the no_passthrough suite. import {configureFailPoint} from "jstests/libs/fail_point_util.js" ; import {ShardingTest} from "jstests/libs/shardingtest.js" ; const caseInsensitive = { locale: "en_US" , strength: 2 }; // 2 shards. var st = new ShardingTest({shards: 2}); var testDB = st.s.getDB( "test" ); assert .commandWorked( testDB.adminCommand({enableSharding: testDB.getName(), primaryShard: st.shard0.shardName})); // Create a collection with a case -insensitive default collation sharded on {a: 1}. var collCaseInsensitive = testDB.getCollection( "case_insensitive" ); collCaseInsensitive.drop(); assert .commandWorked(testDB.createCollection( "case_insensitive" , {collation: caseInsensitive})); assert .commandWorked(collCaseInsensitive.createIndex({a: 1}, {collation: {locale: "simple" }})); assert .commandWorked(testDB.adminCommand({ shardCollection: collCaseInsensitive.getFullName(), key: {a: 1}, collation: {locale: "simple" } })); // Split the collection. // shard0: [chunk 1] { "a" : { "$minKey" : 1 } } -->> { "a" : 0 } // shard0: [chunk 2] { "a" : 0 } -->> { "a" : "b" } // shard1: [chunk 3] { "a" : "b" } -->> { "a" : { "$maxKey" : 1 }} // Note that we need two chunks on shard0 for this repro. My guess is that its because if we move // all the chunks from shard0 to shard1, we will somehow know to only target shard1 in the query // below. assert .commandWorked( testDB.adminCommand({split: collCaseInsensitive.getFullName(), middle: {a: 0}})); assert .commandWorked( testDB.adminCommand({split: collCaseInsensitive.getFullName(), middle: {a: "b" }})); assert .commandWorked(testDB.adminCommand( {moveChunk: collCaseInsensitive.getFullName(), find: {a: -1}, to: st.shard0.shardName})); assert .commandWorked(testDB.adminCommand( {moveChunk: collCaseInsensitive.getFullName(), find: {a: "a" }, to: st.shard0.shardName})); assert .commandWorked(testDB.adminCommand( {moveChunk: collCaseInsensitive.getFullName(), find: {a: "c" }, to: st.shard1.shardName})); // Put data on shard0, that will go into chunk 1. const doc = { _id: 0, a: "a" }; assert .commandWorked(collCaseInsensitive.insert(doc)); // Perform a chunk migration of chunk 1 from shard0 to shard1, but do not clean up orphans on // shard0. let suspendRangeDeletionShard0 = configureFailPoint(st.shard0, 'suspendRangeDeletion' ); testDB.adminCommand( {moveChunk: collCaseInsensitive.getFullName(), find: {a: "a" }, to: st.shard1.shardName}); // Equality predicate. Since the query has non-simple collation we will have to broadcast to all // shards (since the shard key is on a simple collation index). However, we return the result doc // twice which means we do not properly do shard filtering in this case . const results = collCaseInsensitive.find({a: "a" }).collation(caseInsensitive).toArray(); print( "results are " , tojson(results)); assert .eq(results, [doc, doc]); // BAD! DUPLICATE RESULT! suspendRangeDeletionShard0.off(); st.stop();
Sprint:
QO 2024-09-16, QO 2024-09-30, QO 2024-10-14
Linked BF Score:
0

In the case where we have a collection with non-simple default collation, and the collection is sharded on a field where the backing index has a simple collation (what's important here is that its just a different collation from the default collection collation), we cannot do shard targeting for an equality query with a non-simple collation so we broadcast the query to all shards. However, we also do not do shard filtering in this case. So if a chunk migration happens right before the query and the source shard hasn't yet cleaned up orphans, we will return duplicate results. I've attached a more thorough repro in the "steps to reproduce" section.

This happens on master, 8.0, 7.0, 6.0, and 5.0 (i.e. the repro I attached succeeds on all these versions).

is caused by

SERVER-39191 Performance regression for counts post-sharding

Closed

related to

SERVER-94611 Update SHARDING_FILTER logic to support non-simple collation sharding

Open

SERVER-92488 Expand IDHACK eligibility to include {_id: {$eq: <val>}}

Closed

Assignee:: James Harrison

Reporter:: Militsa Sotirova

Participants:: Githook User, James Harrison, Militsa Sotirova

Votes:: 0 Vote for this issue

Watchers:: 17 Start watching this issue

Created:: Aug 30 2024 06:50:19 PM UTC

Updated:: Jan 13 2025 09:42:04 PM UTC

Resolved:: Oct 24 2024 08:07:44 AM UTC

Details

Description

Attachments

Issue Links

Activity

People

Dates