in utils/es.py [0:0]
def create_index_missing_for_docs(client: Elasticsearch):
    """
    Build the index that collects documents which were overwritten at least once.

    Steps, in order:
    1. create ``overwritten_docs_index`` via ``create_index``;
    2. register the ``get-missing-docs`` ingest pipeline, whose single ``drop``
       processor discards every document with ``_version == 1``;
    3. reindex ``tsdb_index`` into ``overwritten_docs_index`` through that
       pipeline, using ``version_type`` ``external``.
    :param client: ES client.
    """
    drop_pipeline_id = 'get-missing-docs'
    # A document still at version 1 is treated as "never overwritten" (see the
    # pipeline description), so the pipeline drops it and only documents with a
    # higher version reach the destination index.
    drop_pipeline_definition = {
        'description': "Drop all documents that were not overwritten.",
        "processors": [
            {"drop": {"if": "ctx._version == 1"}},
        ],
    }

    create_index(client, overwritten_docs_index)
    IngestClient(client).put_pipeline(
        id=drop_pipeline_id,
        body=drop_pipeline_definition,
    )

    # Destination settings: route every copied document through the drop
    # pipeline registered above.
    reindex_target = {
        "index": overwritten_docs_index,
        "version_type": "external",
        "pipeline": drop_pipeline_id,
    }
    client.reindex(
        source={"index": tsdb_index},
        dest=reindex_target,
        refresh=True,
    )