【发布时间】:2018-11-23 06:02:52
【问题描述】:
我正在使用 MongoDB 3.6,我的集合中有大约 5-6 lakh(即 50–60 万)个文档。我希望既能进行全文搜索,又能进行部分匹配搜索。 `
db.temp.find( {$and : [{"status" : {"$in" : [ 1, 2]} },
{$or:[ { $text: { $search: "school" }}
,{ cname : /school/i}
,{ name : /school/i}
]} ]},
{cname:1,name:1,followers:1,status :1, score: { $meta:
"textScore" } } ).sort( { score: { $meta: "textScore"
},status :-1 ,followers :-1 } )
` temp 集合上的索引:
db.temp.createIndex(
{
name: "text",
cname: "text"
},
{
weights: {
name: 4,
cname: 2
}
}
)
db.getCollection("temp").createIndex({
"cname": 1
}, {background: true})
db.getCollection("temp").createIndex({
"status" : -1.0,
"followers" : -1.0
}, {background: true});
db.getCollection("temp").createIndex({
"name": 1
}, {background: true})`
文档如下:
{
"_id" : 5011.0,
"cname" : "samyselvik",
"name" : "Samy Sam",
"imgname" : "nrwi4769731443194380996.jpg",
"followers" : 1.0,
"status" : 1.0,
"createdat" : 1443194421532.0
}
当我查看执行统计信息('executionStats')时,它显示:
"executionStats" :{
"executionSuccess" : true,
"nReturned" : 363.0,
"executionTimeMillis" : 894.0,
"totalKeysExamined" : 921424.0,
"totalDocsExamined" : 372.0,
"executionStages" : {
"stage" : "PROJECTION",
"nReturned" : 363.0,
"executionTimeMillisEstimate" : 808.0,
"works" : 921803.0,
"advanced" : 363.0,
"needTime" : 921439.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"transformBy" : {
"cname" : 1.0,
"name" : 1.0,
"followers" : 1.0,
"score" : {
"$meta" : "textScore"
}
},
"inputStage" : {
"stage" : "SORT",
"nReturned" : 363.0,
"executionTimeMillisEstimate" : 774.0,
"works" : 921803.0,
"advanced" : 363.0,
"needTime" : 921439.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"sortPattern" : {
"score" : {
"$meta" : "textScore"
},
"status" : -1.0,
"followers" : -1.0
},
"memUsage" : 131542.0,
"memLimit" : 33554432.0,
"limitAmount" : 500.0,
"inputStage" : {
"stage" : "SORT_KEY_GENERATOR",
"nReturned" : 363.0,
"executionTimeMillisEstimate" : 730.0,
"works" : 921439.0,
"advanced" : 363.0,
"needTime" : 921075.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"inputStage" : {
"stage" : "FETCH",
"filter" : {
"status" : {
"$in" : [
1.0,
2.0
]
}
},
"nReturned" : 363.0,
"executionTimeMillisEstimate" : 719.0,
"works" : 921438.0,
"advanced" : 363.0,
"needTime" : 921074.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"docsExamined" : 363.0,
"alreadyHasObj" : 9.0,
"inputStage" : {
"stage" : "OR",
"nReturned" : 363.0,
"executionTimeMillisEstimate" : 697.0,
"works" : 921438.0,
"advanced" : 363.0,
"needTime" : 921074.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"dupsTested" : 399.0,
"dupsDropped" : 36.0,
"recordIdsForgotten" : 0.0,
"inputStages" : [
{
"stage" : "TEXT",
"nReturned" : 9.0,
"executionTimeMillisEstimate" : 0.0,
"works" : 21.0,
"advanced" : 9.0,
"needTime" : 11.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"indexPrefix" : {
},
"indexName" : "name_text_cname_text",
"parsedTextQuery" : {
"terms" : [
"sam"
],
"negatedTerms" : [
],
"phrases" : [
],
"negatedPhrases" : [
]
},
"textIndexVersion" : 3.0,
"inputStage" : {
"stage" : "TEXT_MATCH",
"nReturned" : 9.0,
"executionTimeMillisEstimate" : 0.0,
"works" : 21.0,
"advanced" : 9.0,
"needTime" : 11.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"docsRejected" : 0.0,
"inputStage" : {
"stage" : "TEXT_OR",
"nReturned" : 9.0,
"executionTimeMillisEstimate" : 0.0,
"works" : 21.0,
"advanced" : 9.0,
"needTime" : 11.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"docsExamined" : 9.0,
"inputStage" : {
"stage" : "IXSCAN",
"nReturned" : 9.0,
"executionTimeMillisEstimate" : 0.0,
"works" : 10.0,
"advanced" : 9.0,
"needTime" : 0.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"keyPattern" : {
"_fts" : "text",
"_ftsx" : 1.0
},
"indexName" : "name_text_cname_text",
"isMultiKey" : true,
"isUnique" : false,
"isSparse" : false,
"isPartial" : false,
"indexVersion" : 2.0,
"direction" : "backward",
"indexBounds" : {
},
"keysExamined" : 9.0,
"seeks" : 1.0,
"dupsTested" : 9.0,
"dupsDropped" : 0.0,
"seenInvalidated" : 0.0
}
}
}
},
{
"stage" : "IXSCAN",
"filter" : {
"$or" : [
{
"cname" : {
"$regex" : "Sam",
"$options" : "i"
}
}
]
},
"nReturned" : 193.0,
"executionTimeMillisEstimate" : 357.0,
"works" : 460693.0,
"advanced" : 193.0,
"needTime" : 460499.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"keyPattern" : {
"cname" : 1.0
},
"indexName" : "cname_1",
"isMultiKey" : false,
"multiKeyPaths" : {
"cname" : [
]
},
"isUnique" : false,
"isSparse" : false,
"isPartial" : false,
"indexVersion" : 2.0,
"direction" : "forward",
"indexBounds" : {
"cname" : [
"[\"\", {})",
"[/Sam/i, /Sam/i]"
]
},
"keysExamined" : 460692.0,
"seeks" : 1.0,
"dupsTested" : 0.0,
"dupsDropped" : 0.0,
"seenInvalidated" : 0.0
},
{
"stage" : "IXSCAN",
"filter" : {
"$or" : [
{
"name" : {
"$regex" : "Sam",
"$options" : "i"
}
}
]
},
"nReturned" : 197.0,
"executionTimeMillisEstimate" : 318.0,
"works" : 460724.0,
"advanced" : 197.0,
"needTime" : 460526.0,
"needYield" : 0.0,
"saveState" : 7234.0,
"restoreState" : 7234.0,
"isEOF" : 1.0,
"invalidates" : 0.0,
"keyPattern" : {
"name" : 1.0
},
"indexName" : "name_1",
"isMultiKey" : false,
"multiKeyPaths" : {
"name" : [
]
},
"isUnique" : false,
"isSparse" : false,
"isPartial" : false,
"indexVersion" : 2.0,
"direction" : "forward",
"indexBounds" : {
"name" : [
"[\"\", {})",
"[/Sam/i, /Sam/i]"
]
},
"keysExamined" : 460723.0,
"seeks" : 1.0,
"dupsTested" : 0.0,
"dupsDropped" : 0.0,
"seenInvalidated" : 0.0
}
]
}
}
}
}
},
"allPlansExecution" : [
]
}
temp 集合总共有 4.60 lakh(约 46 万)个文档,而检查的键数却比文档数还多。请告诉我如何优化此查询,以便同时使用全文搜索和部分匹配搜索?
【问题讨论】:
-
@AlexBlex 你能解释一下为什么 totalKeysExamined 比文档总数还多吗?
-
@AlexBlex,有什么办法可以优化上述查询,因为我必须更快地搜索?
-
@AlexBlex,文档是这种类型的:{ "_id" : 5011.0, "cname" : "samyselvik", "name" : "Samy Sam", "imgname" : "nrwi4769731443194380996.jpg", "followers" : 1.0, "status" : 1.0, "createdat" : 1443194421532.0 }。"executionStats" : { "executionSuccess" : true, "nReturned" : 363.0, "executionTimeMillis" : 894.0, "totalKeysExamined" : 921424.0, "totalDocsExamined" : 372.0 }
-
@AlexBlex,问题已编辑,补充了文档示例和 executionStats。
标签: mongodb indexing full-text-search query-optimization partial