Question

我有一个大型数据库和一些复合索引。问题是，mongo在查询时不使用索引中的所有字段：即使4个字段都在复合索引中，它也只使用其中的2个。或者它会选用3字段的复合索引，而不是4字段的复合索引。

这是我的 schema（data 和 meta 中还有其他字段，但此查询中没有用到它们）：

{
    store_id: {type: String},
    data: {
        id: {type: Number},
    },
    meta: {
        is_published: {type: Boolean},
        lowercase_sku: {type: String}
    }
}

我有这些索引：

db.products.createIndex({'store_id':1,'meta.is_published':1,'data.id':1})
db.products.createIndex({'store_id':1,'meta.is_published':1,'data.id':1,'meta.lowercase_sku':1})

这是我的查询：

db.products.find({
    'store_id': 'my_domain.com',
    'meta.lowercase_sku': 'go-a83-3034/8+4',
    'meta.is_published': true, 
    'data.id': {'$ne': 7801040323}
}).explain('executionStats')

以下是我从 explain 得到的输出：

{
    "queryPlanner" : {
        "plannerVersion" : 1,
        "namespace" : "my_database.products",
        "indexFilterSet" : false,
        "parsedQuery" : {
            "$and" : [
                {
                    "meta.is_published" : {
                        "$eq" : true
                    }
                },
                {
                    "meta.lowercase_sku" : {
                        "$eq" : "go-a83-3034/8+4"
                    }
                },
                {
                    "store_id" : {
                        "$eq" : "my_domain.com"
                    }
                },
                {
                    "$not" : {
                        "data.id" : {
                            "$eq" : 7801040323
                        }
                    }
                }
            ]
        },
        "winningPlan" : {
            "stage" : "FETCH",
            "filter" : {
                "meta.lowercase_sku" : {
                    "$eq" : "go-a83-3034/8+4"
                }
            },
            "inputStage" : {
                "stage" : "IXSCAN",
                "keyPattern" : {
                    "store_id" : 1,
                    "meta.is_published" : 1,
                    "data.id" : 1
                },
                "indexName" : "store_id_1_meta.is_published_1_data.id_1",
                "isMultiKey" : false,
                "isUnique" : false,
                "isSparse" : false,
                "isPartial" : false,
                "indexVersion" : 1,
                "direction" : "forward",
                "indexBounds" : {
                    "store_id" : [
                        "[\"my_domain.com\", \"my_domain.com\"]"
                    ],
                    "meta.is_published" : [
                        "[true, true]"
                    ],
                    "data.id" : [
                        "[MinKey, 7801040323.0)",
                        "(7801040323.0, MaxKey]"
                    ]
                }
            }
        },
        "rejectedPlans" : [
            {
                "stage" : "FETCH",
                "filter" : {
                    "$and" : [
                        {
                            "$not" : {
                                "data.id" : {
                                    "$eq" : 7801040323
                                }
                            }
                        },
                        {
                            "meta.lowercase_sku" : {
                                "$eq" : "go-a83-3034/8+4"
                            }
                        }
                    ]
                },
                "inputStage" : {
                    "stage" : "IXSCAN",
                    "keyPattern" : {
                        "store_id" : 1,
                        "meta.is_published" : 1,
                        "data.id" : 1,
                        "meta.lowercase_sku" : 1
                    },
                    "indexName" : "store_id_1_meta.is_published_1_data.id_1_meta.lowercase_sku_1",
                    "isMultiKey" : true,
                    "isUnique" : false,
                    "isSparse" : false,
                    "isPartial" : false,
                    "indexVersion" : 1,
                    "direction" : "forward",
                    "indexBounds" : {
                        "store_id" : [
                            "[\"my_domain.com\", \"my_domain.com\"]"
                        ],
                        "meta.is_published" : [
                            "[true, true]"
                        ],
                        "data.id" : [
                            "[MinKey, 7801040323.0)",
                            "(7801040323.0, MaxKey]"
                        ],
                        "meta.lowercase_sku" : [
                            "[MinKey, MaxKey]"
                        ]
                    }
                }
            }
        ]
    },
    "executionStats" : {
        "executionSuccess" : true,
        "nReturned" : 1,
        "executionTimeMillis" : 4590,
        "totalKeysExamined" : 28527,
        "totalDocsExamined" : 28525,
        "executionStages" : {
            "stage" : "FETCH",
            "filter" : {
                "meta.lowercase_sku" : {
                    "$eq" : "go-a83-3034/8+4"
                }
            },
            "nReturned" : 1,
            "executionTimeMillisEstimate" : 130,
            "works" : 28528,
            "advanced" : 1,
            "needTime" : 28525,
            "needYield" : 0,
            "saveState" : 5351,
            "restoreState" : 5351,
            "isEOF" : 1,
            "invalidates" : 0,
            "docsExamined" : 28525,
            "alreadyHasObj" : 0,
            "inputStage" : {
                "stage" : "IXSCAN",
                "nReturned" : 28525,
                "executionTimeMillisEstimate" : 70,
                "works" : 28527,
                "advanced" : 28525,
                "needTime" : 1,
                "needYield" : 0,
                "saveState" : 5351,
                "restoreState" : 5351,
                "isEOF" : 1,
                "invalidates" : 0,
                "keyPattern" : {
                    "store_id" : 1,
                    "meta.is_published" : 1,
                    "data.id" : 1
                },
                "indexName" : "store_id_1_meta.is_published_1_data.id_1",
                "isMultiKey" : false,
                "isUnique" : false,
                "isSparse" : false,
                "isPartial" : false,
                "indexVersion" : 1,
                "direction" : "forward",
                "indexBounds" : {
                    "store_id" : [
                        "[\"my_domain.com\", \"my_domain.com\"]"
                    ],
                    "meta.is_published" : [
                        "[true, true]"
                    ],
                    "data.id" : [
                        "[MinKey, 7801040323.0)",
                        "(7801040323.0, MaxKey]"
                    ]
                },
                "keysExamined" : 28527,
                "dupsTested" : 0,
                "dupsDropped" : 0,
                "seenInvalidated" : 0
            }
        }
    },
    "serverInfo" : {
        "version" : "3.2.18",
        "gitVersion" : "4c1bae566c0c00f996a2feb16febf84936ecaf6f"
    },
    "ok" : 1
}

正如你所看到的，出于某种原因mongo不使用4字段索引；即使我用 hint 指定该索引，它也只使用前两个字段（"store_id" 和 "meta.is_published"）。它往往选择只包含3个字段（"store_id"、"meta.is_published"、"data.id"）的索引——如果4字段索引中只有2个字段被用到，这样选择也算说得通。但为什么会这样呢？

有人能向我解释一下这个问题，并提示一下如何让查询运行得更快吗？

数据库很大（大约11 G）并且它最近被迁移（使用索引导入），如果这有帮助的话。但是，有问题的索引是在导入后创建的。

UPD（2）：我还创建了一个测试集合，其中的文档具有相同的 schema 和索引。在该集合上，同样的查询确实正确地使用了索引。所以我倾向于认为是索引大小或值类型出了某种问题，但我仍然无法确定。

非常感谢任何帮助或见解。

下面是按要求提供的、带有4字段索引 hint 的查询及其结果。

db.products.find({
    'store_id': 'my_domain.com',
    'meta.lowercase_sku': 'go-a83-3034/8+4',
    'meta.is_published': true, 
    'data.id': {'$ne': 7801040323}
}).hint('store_id_1_meta.is_published_1_data.id_1_meta.lowercase_sku_1').explain('executionStats')

结果：

{
    "queryPlanner" : {
        "plannerVersion" : 1,
        "namespace" : "sharp_production.products",
        "indexFilterSet" : false,
        "parsedQuery" : {
            "$and" : [
                {
                    "meta.is_published" : {
                        "$eq" : true
                    }
                },
                {
                    "meta.lowercase_sku" : {
                        "$eq" : "go-a83-3034/8+4"
                    }
                },
                {
                    "store_id" : {
                        "$eq" : "my_domain.com"
                    }
                },
                {
                    "$not" : {
                        "data.id" : {
                            "$eq" : 7801040323
                        }
                    }
                }
            ]
        },
        "winningPlan" : {
            "stage" : "FETCH",
            "filter" : {
                "$and" : [
                    {
                        "$not" : {
                            "data.id" : {
                                "$eq" : 7801040323
                            }
                        }
                    },
                    {
                        "meta.lowercase_sku" : {
                            "$eq" : "go-a83-3034/8+4"
                        }
                    }
                ]
            },
            "inputStage" : {
                "stage" : "IXSCAN",
                "keyPattern" : {
                    "store_id" : 1,
                    "meta.is_published" : 1,
                    "data.id" : 1,
                    "meta.lowercase_sku" : 1
                },
                "indexName" : "store_id_1_meta.is_published_1_data.id_1_meta.lowercase_sku_1",
                "isMultiKey" : true,
                "isUnique" : false,
                "isSparse" : false,
                "isPartial" : false,
                "indexVersion" : 1,
                "direction" : "forward",
                "indexBounds" : {
                    "store_id" : [
                        "[\"my_domain.com\", \"my_domain.com\"]"
                    ],
                    "meta.is_published" : [
                        "[true, true]"
                    ],
                    "data.id" : [
                        "[MinKey, 7801040323.0)",
                        "(7801040323.0, MaxKey]"
                    ],
                    "meta.lowercase_sku" : [
                        "[MinKey, MaxKey]"
                    ]
                }
            }
        },
        "rejectedPlans" : [ ]
    },
    "executionStats" : {
        "executionSuccess" : true,
        "nReturned" : 1,
        "executionTimeMillis" : 213,
        "totalKeysExamined" : 28630,
        "totalDocsExamined" : 28525,
        "executionStages" : {
            "stage" : "FETCH",
            "filter" : {
                "$and" : [
                    {
                        "$not" : {
                            "data.id" : {
                                "$eq" : 7801040323
                            }
                        }
                    },
                    {
                        "meta.lowercase_sku" : {
                            "$eq" : "go-a83-3034/8+4"
                        }
                    }
                ]
            },
            "nReturned" : 1,
            "executionTimeMillisEstimate" : 210,
            "works" : 28630,
            "advanced" : 1,
            "needTime" : 28628,
            "needYield" : 0,
            "saveState" : 223,
            "restoreState" : 223,
            "isEOF" : 1,
            "invalidates" : 0,
            "docsExamined" : 28525,
            "alreadyHasObj" : 0,
            "inputStage" : {
                "stage" : "IXSCAN",
                "nReturned" : 28525,
                "executionTimeMillisEstimate" : 110,
                "works" : 28630,
                "advanced" : 28525,
                "needTime" : 104,
                "needYield" : 0,
                "saveState" : 223,
                "restoreState" : 223,
                "isEOF" : 1,
                "invalidates" : 0,
                "keyPattern" : {
                    "store_id" : 1,
                    "meta.is_published" : 1,
                    "data.id" : 1,
                    "meta.lowercase_sku" : 1
                },
                "indexName" : "store_id_1_meta.is_published_1_data.id_1_meta.lowercase_sku_1",
                "isMultiKey" : true,
                "isUnique" : false,
                "isSparse" : false,
                "isPartial" : false,
                "indexVersion" : 1,
                "direction" : "forward",
                "indexBounds" : {
                    "store_id" : [
                        "[\"my_domain.com\", \"my_domain.com\"]"
                    ],
                    "meta.is_published" : [
                        "[true, true]"
                    ],
                    "data.id" : [
                        "[MinKey, 7801040323.0)",
                        "(7801040323.0, MaxKey]"
                    ],
                    "meta.lowercase_sku" : [
                        "[MinKey, MaxKey]"
                    ]
                },
                "keysExamined" : 28630,
                "dupsTested" : 28628,
                "dupsDropped" : 103,
                "seenInvalidated" : 0
            }
        }
    },
    "serverInfo" : {
        "version" : "3.2.18",
        "gitVersion" : "4c1bae566c0c00f996a2feb16febf84936ecaf6f"
    },
    "ok" : 1
}

更新（1）

好吧，显然 "$ne" 运算符可能会破坏索引的使用，就像@JohnnyHK所说的那样。所以我创建了另一个这样的索引：

db.products.createIndex({'store_id':1,'meta.is_published':1,'meta.lowercase_sku':1})

...并在去掉 "$ne" 条件后尝试将其用于我的查询（该条件只排除一个文档，去掉它并不会真正改变什么）：

db.products.find({
    'store_id': 'my_domain.com',
    'meta.is_published': true,
    'meta.lowercase_sku': 'go-a83-3034/8+4',
}).hint('store_id_1_meta.is_published_1_meta.lowercase_sku_1').explain('executionStats')

但这是我这次得到的结果：

{
    "queryPlanner" : {
        "plannerVersion" : 1,
        "namespace" : "sharp_production.products",
        "indexFilterSet" : false,
        "parsedQuery" : {
            "$and" : [
                {
                    "meta.is_published" : {
                        "$eq" : true
                    }
                },
                {
                    "meta.lowercase_sku" : {
                        "$eq" : "go-a83-3034/8+4"
                    }
                },
                {
                    "store_id" : {
                        "$eq" : "my_domain.com"
                    }
                }
            ]
        },
        "winningPlan" : {
            "stage" : "FETCH",
            "filter" : {
                "meta.lowercase_sku" : {
                    "$eq" : "go-a83-3034/8+4"
                }
            },
            "inputStage" : {
                "stage" : "IXSCAN",
                "keyPattern" : {
                    "store_id" : 1,
                    "meta.is_published" : 1,
                    "meta.lowercase_sku" : 1
                },
                "indexName" : "store_id_1_meta.is_published_1_meta.lowercase_sku_1",
                "isMultiKey" : true,
                "isUnique" : false,
                "isSparse" : false,
                "isPartial" : false,
                "indexVersion" : 1,
                "direction" : "forward",
                "indexBounds" : {
                    "store_id" : [
                        "[\"my_domain.com\", \"my_domain.com\"]"
                    ],
                    "meta.is_published" : [
                        "[true, true]"
                    ],
                    "meta.lowercase_sku" : [
                        "[MinKey, MaxKey]"
                    ]
                }
            }
        },
        "rejectedPlans" : [ ]
    },
    "executionStats" : {
        "executionSuccess" : true,
        "nReturned" : 1,
        "executionTimeMillis" : 136,
        "totalKeysExamined" : 28629,
        "totalDocsExamined" : 28526,
        "executionStages" : {
            "stage" : "FETCH",
            "filter" : {
                "meta.lowercase_sku" : {
                    "$eq" : "go-a83-3034/8+4"
                }
            },
            "nReturned" : 1,
            "executionTimeMillisEstimate" : 120,
            "works" : 28630,
            "advanced" : 1,
            "needTime" : 28628,
            "needYield" : 0,
            "saveState" : 223,
            "restoreState" : 223,
            "isEOF" : 1,
            "invalidates" : 0,
            "docsExamined" : 28526,
            "alreadyHasObj" : 0,
            "inputStage" : {
                "stage" : "IXSCAN",
                "nReturned" : 28526,
                "executionTimeMillisEstimate" : 30,
                "works" : 28630,
                "advanced" : 28526,
                "needTime" : 103,
                "needYield" : 0,
                "saveState" : 223,
                "restoreState" : 223,
                "isEOF" : 1,
                "invalidates" : 0,
                "keyPattern" : {
                    "store_id" : 1,
                    "meta.is_published" : 1,
                    "meta.lowercase_sku" : 1
                },
                "indexName" : "store_id_1_meta.is_published_1_meta.lowercase_sku_1",
                "isMultiKey" : true,
                "isUnique" : false,
                "isSparse" : false,
                "isPartial" : false,
                "indexVersion" : 1,
                "direction" : "forward",
                "indexBounds" : {
                    "store_id" : [
                        "[\"my_domain.com\", \"my_domain.com\"]"
                    ],
                    "meta.is_published" : [
                        "[true, true]"
                    ],
                    "meta.lowercase_sku" : [
                        "[MinKey, MaxKey]"
                    ]
                },
                "keysExamined" : 28629,
                "dupsTested" : 28629,
                "dupsDropped" : 103,
                "seenInvalidated" : 0
            }
        }
    },
    "serverInfo" : {
        "version" : "3.2.18",
        "gitVersion" : "4c1bae566c0c00f996a2feb16febf84936ecaf6f"
    },
    "ok" : 1
}

...它仍然把 "meta.lowercase_sku" 条件留在 FETCH 阶段，即使该字段就在索引中。还有其他想法吗？

Answer 1

这是由于查询计划程序如何选择要使用的索引。

问题的要点是你有多个索引可以满足查询。假设您有两个具有相同前缀的索引：

db.test.createIndex({a:1, b:1})

和

db.test.createIndex({a:1, b:1, c:1})

现在，如果你这样做：

db.test.find({a:1, b:1})

MongoDB如何知道哪个索引可以满足该查询？根据磁盘的布局（在许多方面），一个索引可能比另一个索引更快。

首先，它会使用这个公式对计划进行排名：

score = baseScore + productivity + tieBreakers

目前在MongoDB 3.6.3中，baseScore = 1；productivity取决于计划为返回结果所需做的工作量；tieBreakers取决于计划是否需要FETCH阶段、是否有SORT阶段，以及是否使用了索引交集。

如果两个计划得到了相同的分数（就像上面的两个索引对应的计划一样），那么它就会让它们相互竞争，看哪个计划能更快地返回101个结果。获胜的计划会被缓存，然后被执行。可以想象，这可能是非确定性的，也浪费了服务器的时间。最好是让服务器能够直接根据评分系统选出一个索引。

索引集合的最佳方法是删除非必要索引，以确保MongoDB可以立即选择索引。

注意：如果您对细节感兴趣，可以：

使用db.setLogLevel(5,'query')记录查询规划过程，并在mongod日志中查看打印出的流程。
db.collection.getPlanCache().clear()清除集合的计划缓存。
查看计划排序器（plan ranker）的源代码。
查看博文Optimizing MongoDB Compound Indexes。

Mongo拒绝使用复合索引

1 个答案: