按天分组，对 _pkey 去重计数
hive:
-- Distinct count of non-empty `_pkey` values per day, ordered by day.
-- The grouping key `partion_dt` is exposed as `rq`, so the selected column,
-- the GROUP BY key, and the ORDER BY key all refer to the same expression.
-- (Selecting a bare `rq` while grouping by `partion_dt` is rejected by Hive,
-- because `rq` would be neither aggregated nor a GROUP BY key.)
-- `_pkey` <> '' also drops NULL keys: a comparison with NULL is never true.
-- NOTE(review): `partion_dt` may be a misspelling of `partition_dt`, and
-- `table` is a placeholder (reserved word) -- confirm both against the schema.
SELECT
    COUNT(DISTINCT `_pkey`) AS pkcount,
    partion_dt AS rq
FROM table
WHERE `_pkey` <> ''
GROUP BY partion_dt
ORDER BY rq;
es:
{
  "query": {
    "bool": {
      "filter": [
        {
          "range": {
            "request_time": {
              "gte": "2020-04-01T00:00",
              "lt": "2020-11-27T00:00"
            }
          }
        },
        {
          "exists": {
            "field": "_pkey"
          }
        }
      ]
    }
  },
  "aggs": {
    "request_timelist": {
      "date_histogram": {
        "field": "request_time",
        "interval": "1d",
        "min_doc_count": 0
      },
      "aggs": {
        "pkcount": {
          "cardinality": {
            "field": "_pkey"
          }
        }
      }
    }
  },
  "size": 0
}