Here is my query:
{
"from": 0,
"size": 100,
"query": {
"bool": {
"filter": [
{
"terms": {
"folderId.keyword": [
"ff98505e-cdff-43aa-8b05-197bc3f3265e"
],
"boost": 1
}
},
{
"terms": {
"objectType.keyword": [
"File"
],
"boost": 1
}
},
{
"term": {
"tenantId": {
"value": "34202",
"boost": 1
}
}
}
],
"adjust_pure_negative": true,
"boost": 1
}
},
"aggs":{
"_byformat":{
"terms":{
"field":"format.keyword",
"min_doc_count":0,
"size":200
}
}
}
}
Result with min_doc_count = 0:
{
"took" : 1, "timed_out" : false, "_shards" : { "total" : 1, "successful" : 1, "skipped" : 0, "failed" : 0 }, "hits" : { "total" : 3, "max_score" : 0.0, "hits" : [ { "_index" : "plnesdv1-34202-1", "_type" : "_doc", "_id" : "6adbda83-53ad-457f-a2ab-d5b04c643005", "_score" : 0.0, "_source" : { "format" : "vnd.openxmlformats-officedocument.spreadsheetml.sheet", "externalSharing" : "N", "description" : null, "dateModified" : null, "type" : "application", "folderId" : "ff98505e-cdff-43aa-8b05-197bc3f3265e", "tags" : [ ], "objectType" : "File", "dateCreated" : null, "name" : "New XLSX file", "tenantId" : "34202", "modifiedBy" : "rdt001", "id" : "6adbda83-53ad-457f-a2ab-d5b04c643005", "status" : "active", "expirationDate" : null } }, { "_index" : "plnesdv1-34202-1", "_type" : "_doc", "_id" : "b1000a15-2d80-41f4-a5df-ba5c27f8e9c6", "_score" : 0.0, "_source" : { "format" : "vnd.ms-excel", "externalSharing" : "N", "description" : null, "dateModified" : null, "type" : "application", "folderId" : "ff98505e-cdff-43aa-8b05-197bc3f3265e", "tags" : [ ], "objectType" : "File", "dateCreated" : null, "name" : "New XLS file", "tenantId" : "34202", "modifiedBy" : "rdt001", "id" : "b1000a15-2d80-41f4-a5df-ba5c27f8e9c6", "status" : "active", "expirationDate" : null } }, { "_index" : "plnesdv1-34202-1", "_type" : "_doc", "_id" : "630e9f49-3368-408d-a091-03f253127004", "_score" : 0.0, "_source" : { "format" : "msword", "externalSharing" : "N", "description" : null, "dateModified" : null, "type" : "application", "folderId" : "ff98505e-cdff-43aa-8b05-197bc3f3265e", "tags" : [ ], "objectType" : "File", "dateCreated" : null, "name" : "New DOC file", "tenantId" : "34202", "modifiedBy" : "rdt001", "id" : "630e9f49-3368-408d-a091-03f253127004", "status" : "active", "expirationDate" : null } } ] }, "aggregations" : { "_byformat" : { "doc_count_error_upper_bound" : 0, "sum_other_doc_count" : 0, "buckets" : [ { "key" : "msword", "doc_count" : 1 }, { "key" : "vnd.ms-excel", "doc_count" : 1 }, { "key" 
: "vnd.openxmlformats-officedocument.spreadsheetml.sheet", "doc_count" : 1 }, { "key" : "bmp", "doc_count" : 0 }, { "key" : "gif", "doc_count" : 0 }, { "key" : "html", "doc_count" : 0 } ] } } }
Result with min_doc_count = 1:
{
"took" : 0,
"timed_out" : false,
"_shards" : {
"total" : 1,
"successful" : 1,
"skipped" : 0,
"failed" : 0
},
"hits" : {
"total" : 3,
"max_score" : 0.0,
"hits" : [
{
"_index" : "plnesdv1-34202-1",
"_type" : "_doc",
"_id" : "6adbda83-53ad-457f-a2ab-d5b04c643005",
"_score" : 0.0,
"_source" : {
"format" : "vnd.openxmlformats-officedocument.spreadsheetml.sheet",
"externalSharing" : "N",
"description" : null,
"dateModified" : null,
"type" : "application",
"folderId" : "ff98505e-cdff-43aa-8b05-197bc3f3265e",
"tags" : [ ],
"objectType" : "File",
"dateCreated" : null,
"name" : "New XLSX file",
"tenantId" : "34202",
"modifiedBy" : "rdt001",
"id" : "6adbda83-53ad-457f-a2ab-d5b04c643005",
"status" : "active",
"expirationDate" : null
}
},
{
"_index" : "plnesdv1-34202-1",
"_type" : "_doc",
"_id" : "b1000a15-2d80-41f4-a5df-ba5c27f8e9c6",
"_score" : 0.0,
"_source" : {
"format" : "vnd.ms-excel",
"externalSharing" : "N",
"description" : null,
"dateModified" : null,
"type" : "application",
"folderId" : "ff98505e-cdff-43aa-8b05-197bc3f3265e",
"tags" : [ ],
"objectType" : "File",
"dateCreated" : null,
"name" : "New XLS file",
"tenantId" : "34202",
"modifiedBy" : "rdt001",
"id" : "b1000a15-2d80-41f4-a5df-ba5c27f8e9c6",
"status" : "active",
"expirationDate" : null
}
},
{
"_index" : "plnesdv1-34202-1",
"_type" : "_doc",
"_id" : "630e9f49-3368-408d-a091-03f253127004",
"_score" : 0.0,
"_source" : {
"format" : "msword",
"externalSharing" : "N",
"description" : null,
"dateModified" : null,
"type" : "application",
"folderId" : "ff98505e-cdff-43aa-8b05-197bc3f3265e",
"tags" : [ ],
"objectType" : "File",
"dateCreated" : null,
"name" : "New DOC file",
"tenantId" : "34202",
"modifiedBy" : "rdt001",
"id" : "630e9f49-3368-408d-a091-03f253127004",
"status" : "active",
"expirationDate" : null
}
}
]
},
"aggregations" : {
"_byformat" : {
"doc_count_error_upper_bound" : 0,
"sum_other_doc_count" : 0,
"buckets" : [
{
"key" : "msword",
"doc_count" : 1
},
{
"key" : "vnd.ms-excel",
"doc_count" : 1
},
{
"key" : "vnd.openxmlformats-officedocument.spreadsheetml.sheet",
"doc_count" : 1
}
]
}
}
}
The aggregations are correct when min_doc_count = 1: only the buckets relevant to the hits are returned.
Could anyone tell me why the aggregation returns all buckets when min_doc_count = 0 is set? I have gone through the Elasticsearch documentation, and it states that this behavior is by design. Is there any other way to get aggregation buckets only for the hits, including buckets with a zero count as well?