elasticsearch_serverless/_sync/client/ingest.py (238 lines of code) (raw):
# Licensed to Elasticsearch B.V. under one or more contributor
# license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright
# ownership. Elasticsearch B.V. licenses this file to you under
# the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
import typing as t
from elastic_transport import ObjectApiResponse
from ._base import NamespacedClient
from .utils import SKIP_IN_PATH, _quote, _rewrite_parameters
class IngestClient(NamespacedClient):
@_rewrite_parameters()
def delete_pipeline(
self,
*,
id: str,
error_trace: t.Optional[bool] = None,
filter_path: t.Optional[t.Union[str, t.Sequence[str]]] = None,
human: t.Optional[bool] = None,
master_timeout: t.Optional[t.Union[str, t.Literal[-1], t.Literal[0]]] = None,
pretty: t.Optional[bool] = None,
timeout: t.Optional[t.Union[str, t.Literal[-1], t.Literal[0]]] = None,
) -> ObjectApiResponse[t.Any]:
"""
.. raw:: html
<p>Delete pipelines.
Delete one or more ingest pipelines.</p>
`<https://www.elastic.co/docs/api/doc/elasticsearch/operation/operation-ingest-delete-pipeline>`_
:param id: Pipeline ID or wildcard expression of pipeline IDs used to limit the
request. To delete all ingest pipelines in a cluster, use a value of `*`.
:param master_timeout: Period to wait for a connection to the master node. If
no response is received before the timeout expires, the request fails and
returns an error.
:param timeout: Period to wait for a response. If no response is received before
the timeout expires, the request fails and returns an error.
"""
if id in SKIP_IN_PATH:
raise ValueError("Empty value passed for parameter 'id'")
__path_parts: t.Dict[str, str] = {"id": _quote(id)}
__path = f'/_ingest/pipeline/{__path_parts["id"]}'
__query: t.Dict[str, t.Any] = {}
if error_trace is not None:
__query["error_trace"] = error_trace
if filter_path is not None:
__query["filter_path"] = filter_path
if human is not None:
__query["human"] = human
if master_timeout is not None:
__query["master_timeout"] = master_timeout
if pretty is not None:
__query["pretty"] = pretty
if timeout is not None:
__query["timeout"] = timeout
__headers = {"accept": "application/json"}
return self.perform_request( # type: ignore[return-value]
"DELETE",
__path,
params=__query,
headers=__headers,
endpoint_id="ingest.delete_pipeline",
path_parts=__path_parts,
)
@_rewrite_parameters()
def get_pipeline(
self,
*,
id: t.Optional[str] = None,
error_trace: t.Optional[bool] = None,
filter_path: t.Optional[t.Union[str, t.Sequence[str]]] = None,
human: t.Optional[bool] = None,
master_timeout: t.Optional[t.Union[str, t.Literal[-1], t.Literal[0]]] = None,
pretty: t.Optional[bool] = None,
summary: t.Optional[bool] = None,
) -> ObjectApiResponse[t.Any]:
"""
.. raw:: html
<p>Get pipelines.</p>
<p>Get information about one or more ingest pipelines.
This API returns a local reference of the pipeline.</p>
`<https://www.elastic.co/docs/api/doc/elasticsearch/operation/operation-ingest-get-pipeline>`_
:param id: Comma-separated list of pipeline IDs to retrieve. Wildcard (`*`) expressions
are supported. To get all ingest pipelines, omit this parameter or use `*`.
:param master_timeout: Period to wait for a connection to the master node. If
no response is received before the timeout expires, the request fails and
returns an error.
:param summary: Return pipelines without their definitions (default: false)
"""
__path_parts: t.Dict[str, str]
if id not in SKIP_IN_PATH:
__path_parts = {"id": _quote(id)}
__path = f'/_ingest/pipeline/{__path_parts["id"]}'
else:
__path_parts = {}
__path = "/_ingest/pipeline"
__query: t.Dict[str, t.Any] = {}
if error_trace is not None:
__query["error_trace"] = error_trace
if filter_path is not None:
__query["filter_path"] = filter_path
if human is not None:
__query["human"] = human
if master_timeout is not None:
__query["master_timeout"] = master_timeout
if pretty is not None:
__query["pretty"] = pretty
if summary is not None:
__query["summary"] = summary
__headers = {"accept": "application/json"}
return self.perform_request( # type: ignore[return-value]
"GET",
__path,
params=__query,
headers=__headers,
endpoint_id="ingest.get_pipeline",
path_parts=__path_parts,
)
@_rewrite_parameters()
def processor_grok(
self,
*,
error_trace: t.Optional[bool] = None,
filter_path: t.Optional[t.Union[str, t.Sequence[str]]] = None,
human: t.Optional[bool] = None,
pretty: t.Optional[bool] = None,
) -> ObjectApiResponse[t.Any]:
"""
.. raw:: html
<p>Run a grok processor.
Extract structured fields out of a single text field within a document.
You must choose which field to extract matched fields from, as well as the grok pattern you expect will match.
A grok pattern is like a regular expression that supports aliased expressions that can be reused.</p>
`<https://www.elastic.co/guide/en/elasticsearch/reference/master/grok-processor.html>`_
"""
__path_parts: t.Dict[str, str] = {}
__path = "/_ingest/processor/grok"
__query: t.Dict[str, t.Any] = {}
if error_trace is not None:
__query["error_trace"] = error_trace
if filter_path is not None:
__query["filter_path"] = filter_path
if human is not None:
__query["human"] = human
if pretty is not None:
__query["pretty"] = pretty
__headers = {"accept": "application/json"}
return self.perform_request( # type: ignore[return-value]
"GET",
__path,
params=__query,
headers=__headers,
endpoint_id="ingest.processor_grok",
path_parts=__path_parts,
)
@_rewrite_parameters(
body_fields=(
"deprecated",
"description",
"meta",
"on_failure",
"processors",
"version",
),
parameter_aliases={"_meta": "meta"},
)
def put_pipeline(
self,
*,
id: str,
deprecated: t.Optional[bool] = None,
description: t.Optional[str] = None,
error_trace: t.Optional[bool] = None,
filter_path: t.Optional[t.Union[str, t.Sequence[str]]] = None,
human: t.Optional[bool] = None,
if_version: t.Optional[int] = None,
master_timeout: t.Optional[t.Union[str, t.Literal[-1], t.Literal[0]]] = None,
meta: t.Optional[t.Mapping[str, t.Any]] = None,
on_failure: t.Optional[t.Sequence[t.Mapping[str, t.Any]]] = None,
pretty: t.Optional[bool] = None,
processors: t.Optional[t.Sequence[t.Mapping[str, t.Any]]] = None,
timeout: t.Optional[t.Union[str, t.Literal[-1], t.Literal[0]]] = None,
version: t.Optional[int] = None,
body: t.Optional[t.Dict[str, t.Any]] = None,
) -> ObjectApiResponse[t.Any]:
"""
.. raw:: html
<p>Create or update a pipeline.
Changes made using this API take effect immediately.</p>
`<https://www.elastic.co/guide/en/elasticsearch/reference/master/ingest.html>`_
:param id: ID of the ingest pipeline to create or update.
:param deprecated: Marks this ingest pipeline as deprecated. When a deprecated
ingest pipeline is referenced as the default or final pipeline when creating
or updating a non-deprecated index template, Elasticsearch will emit a deprecation
warning.
:param description: Description of the ingest pipeline.
:param if_version: Required version for optimistic concurrency control for pipeline
updates
:param master_timeout: Period to wait for a connection to the master node. If
no response is received before the timeout expires, the request fails and
returns an error.
:param meta: Optional metadata about the ingest pipeline. May have any contents.
This map is not automatically generated by Elasticsearch.
:param on_failure: Processors to run immediately after a processor failure. Each
processor supports a processor-level `on_failure` value. If a processor without
an `on_failure` value fails, Elasticsearch uses this pipeline-level parameter
as a fallback. The processors in this parameter run sequentially in the order
specified. Elasticsearch will not attempt to run the pipeline's remaining
processors.
:param processors: Processors used to perform transformations on documents before
indexing. Processors run sequentially in the order specified.
:param timeout: Period to wait for a response. If no response is received before
the timeout expires, the request fails and returns an error.
:param version: Version number used by external systems to track ingest pipelines.
This parameter is intended for external systems only. Elasticsearch does
not use or validate pipeline version numbers.
"""
if id in SKIP_IN_PATH:
raise ValueError("Empty value passed for parameter 'id'")
__path_parts: t.Dict[str, str] = {"id": _quote(id)}
__path = f'/_ingest/pipeline/{__path_parts["id"]}'
__query: t.Dict[str, t.Any] = {}
__body: t.Dict[str, t.Any] = body if body is not None else {}
if error_trace is not None:
__query["error_trace"] = error_trace
if filter_path is not None:
__query["filter_path"] = filter_path
if human is not None:
__query["human"] = human
if if_version is not None:
__query["if_version"] = if_version
if master_timeout is not None:
__query["master_timeout"] = master_timeout
if pretty is not None:
__query["pretty"] = pretty
if timeout is not None:
__query["timeout"] = timeout
if not __body:
if deprecated is not None:
__body["deprecated"] = deprecated
if description is not None:
__body["description"] = description
if meta is not None:
__body["_meta"] = meta
if on_failure is not None:
__body["on_failure"] = on_failure
if processors is not None:
__body["processors"] = processors
if version is not None:
__body["version"] = version
__headers = {"accept": "application/json", "content-type": "application/json"}
return self.perform_request( # type: ignore[return-value]
"PUT",
__path,
params=__query,
headers=__headers,
body=__body,
endpoint_id="ingest.put_pipeline",
path_parts=__path_parts,
)
@_rewrite_parameters(
body_fields=("docs", "pipeline"),
)
def simulate(
self,
*,
docs: t.Optional[t.Sequence[t.Mapping[str, t.Any]]] = None,
id: t.Optional[str] = None,
error_trace: t.Optional[bool] = None,
filter_path: t.Optional[t.Union[str, t.Sequence[str]]] = None,
human: t.Optional[bool] = None,
pipeline: t.Optional[t.Mapping[str, t.Any]] = None,
pretty: t.Optional[bool] = None,
verbose: t.Optional[bool] = None,
body: t.Optional[t.Dict[str, t.Any]] = None,
) -> ObjectApiResponse[t.Any]:
"""
.. raw:: html
<p>Simulate a pipeline.</p>
<p>Run an ingest pipeline against a set of provided documents.
You can either specify an existing pipeline to use with the provided documents or supply a pipeline definition in the body of the request.</p>
`<https://www.elastic.co/docs/api/doc/elasticsearch/operation/operation-ingest-simulate>`_
:param docs: Sample documents to test in the pipeline.
:param id: The pipeline to test. If you don't specify a `pipeline` in the request
body, this parameter is required.
:param pipeline: The pipeline to test. If you don't specify the `pipeline` request
path parameter, this parameter is required. If you specify both this and
the request path parameter, the API only uses the request path parameter.
:param verbose: If `true`, the response includes output data for each processor
in the executed pipeline.
"""
if docs is None and body is None:
raise ValueError("Empty value passed for parameter 'docs'")
__path_parts: t.Dict[str, str]
if id not in SKIP_IN_PATH:
__path_parts = {"id": _quote(id)}
__path = f'/_ingest/pipeline/{__path_parts["id"]}/_simulate'
else:
__path_parts = {}
__path = "/_ingest/pipeline/_simulate"
__query: t.Dict[str, t.Any] = {}
__body: t.Dict[str, t.Any] = body if body is not None else {}
if error_trace is not None:
__query["error_trace"] = error_trace
if filter_path is not None:
__query["filter_path"] = filter_path
if human is not None:
__query["human"] = human
if pretty is not None:
__query["pretty"] = pretty
if verbose is not None:
__query["verbose"] = verbose
if not __body:
if docs is not None:
__body["docs"] = docs
if pipeline is not None:
__body["pipeline"] = pipeline
__headers = {"accept": "application/json", "content-type": "application/json"}
return self.perform_request( # type: ignore[return-value]
"POST",
__path,
params=__query,
headers=__headers,
body=__body,
endpoint_id="ingest.simulate",
path_parts=__path_parts,
)