Files
opensearch-pyd/opensearch/_async/client/__init__.py
T

2092 lines
85 KiB
Python
Raw Normal View History

2020-05-15 09:36:47 -05:00
# -*- coding: utf-8 -*-
# SPDX-License-Identifier: Apache-2.0
#
# The OpenSearch Contributors require contributions made to
# this file be licensed under the Apache-2.0 license or a
# compatible open source license.
#
# Modifications Copyright OpenSearch Contributors. See
# GitHub history for details.
#
# Licensed to Elasticsearch B.V. under one or more contributor
# license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright
# ownership. Elasticsearch B.V. licenses this file to you under
# the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
2020-05-15 09:36:47 -05:00
from __future__ import unicode_literals
2020-05-15 09:36:47 -05:00
import logging
2020-05-20 12:34:29 -05:00
from ..transport import AsyncTransport, TransportError
2020-06-23 15:34:31 -05:00
from .cat import CatClient
from .cluster import ClusterClient
from .dangling_indices import DanglingIndicesClient
2021-03-23 15:12:20 -05:00
from .features import FeaturesClient
from .indices import IndicesClient
from .ingest import IngestClient
from .nodes import NodesClient
from .remote import RemoteClient
from .snapshot import SnapshotClient
from .tasks import TasksClient
from .utils import SKIP_IN_PATH, _bulk_body, _make_path, _normalize_hosts, query_params
2020-05-15 09:36:47 -05:00
2021-08-13 15:51:50 +05:30
logger = logging.getLogger("opensearch")
2020-05-15 09:36:47 -05:00
2021-08-13 15:51:50 +05:30
class AsyncOpenSearch(object):
2020-05-15 09:36:47 -05:00
"""
2021-08-13 15:51:50 +05:30
OpenSearch low-level client. Provides a straightforward mapping from
Python to OpenSearch REST endpoints.
2020-05-15 09:36:47 -05:00
The instance has attributes ``cat``, ``cluster``, ``indices``, ``ingest``,
``nodes``, ``snapshot`` and ``tasks`` that provide access to instances of
2021-08-13 15:51:50 +05:30
:class:`~opensearch.client.CatClient`,
:class:`~opensearch.client.ClusterClient`,
:class:`~opensearch.client.IndicesClient`,
:class:`~opensearch.client.IngestClient`,
:class:`~opensearch.client.NodesClient`,
:class:`~opensearch.client.SnapshotClient` and
:class:`~opensearch.client.TasksClient` respectively. This is the
2020-05-15 09:36:47 -05:00
preferred (and only supported) way to get access to those classes and their
methods.
You can specify your own connection class which should be used by providing
the ``connection_class`` parameter::
# create connection to localhost using the ThriftConnection
client = OpenSearch(connection_class=ThriftConnection)
2020-05-15 09:36:47 -05:00
If you want to turn on :ref:`sniffing` you have several options (described
2021-08-13 15:51:50 +05:30
in :class:`~opensearch.Transport`)::
2020-05-15 09:36:47 -05:00
# create connection that will automatically inspect the cluster to get
# the list of active nodes. Start with nodes running on
# 'opensearchnode1' and 'opensearchnode2'
client = OpenSearch(
['opensearchnode1', 'opensearchnode2'],
2020-05-15 09:36:47 -05:00
# sniff before doing anything
sniff_on_start=True,
# refresh nodes after a node fails to respond
sniff_on_connection_fail=True,
# and also every 60 seconds
sniffer_timeout=60
)
Different hosts can have different parameters, use a dictionary per node to
specify those::
# connect to localhost directly and another node using SSL on port 443
# and an url_prefix. Note that ``port`` needs to be an int.
client = OpenSearch([
2020-05-15 09:36:47 -05:00
{'host': 'localhost'},
{'host': 'othernode', 'port': 443, 'url_prefix': 'opensearch', 'use_ssl': True},
2020-05-15 09:36:47 -05:00
])
If using SSL, there are several parameters that control how we deal with
2021-08-13 15:51:50 +05:30
certificates (see :class:`~opensearch.Urllib3HttpConnection` for
2020-05-15 09:36:47 -05:00
detailed description of the options)::
client = OpenSearch(
2020-05-15 09:36:47 -05:00
['localhost:443', 'other_host:443'],
# turn on SSL
use_ssl=True,
# make sure we verify SSL certificates
verify_certs=True,
# provide a path to CA certs on disk
ca_certs='/path/to/CA_certs'
)
If using SSL, but don't verify the certs, a warning message is showed
2021-08-13 15:51:50 +05:30
optionally (see :class:`~opensearch.Urllib3HttpConnection` for
2020-05-15 09:36:47 -05:00
detailed description of the options)::
client = OpenSearch(
2020-05-15 09:36:47 -05:00
['localhost:443', 'other_host:443'],
# turn on SSL
use_ssl=True,
# no verify SSL certificates
verify_certs=False,
# don't show warnings about ssl certs verification
ssl_show_warn=False
)
SSL client authentication is supported
2021-08-13 15:51:50 +05:30
(see :class:`~opensearch.Urllib3HttpConnection` for
2020-05-15 09:36:47 -05:00
detailed description of the options)::
client = OpenSearch(
2020-05-15 09:36:47 -05:00
['localhost:443', 'other_host:443'],
# turn on SSL
use_ssl=True,
# make sure we verify SSL certificates
verify_certs=True,
# provide a path to CA certs on disk
ca_certs='/path/to/CA_certs',
# PEM formatted SSL client certificate
client_cert='/path/to/clientcert.pem',
# PEM formatted SSL client key
client_key='/path/to/clientkey.pem'
)
Alternatively you can use RFC-1738 formatted URLs, as long as they are not
in conflict with other options::
client = OpenSearch(
2020-05-15 09:36:47 -05:00
[
'http://user:secret@localhost:9200/',
'https://user:secret@other_host:443/production'
],
verify_certs=True
)
By default, `JSONSerializer
2021-08-13 15:51:50 +05:30
<https://github.com/opensearch-project/opensearch-py/blob/master/opensearch/serializer.py#L24>`_
2020-05-15 09:36:47 -05:00
is used to encode all outgoing requests.
However, you can implement your own custom serializer::
2021-08-13 15:51:50 +05:30
from opensearch.serializer import JSONSerializer
2020-05-15 09:36:47 -05:00
class SetEncoder(JSONSerializer):
def default(self, obj):
if isinstance(obj, set):
return list(obj)
if isinstance(obj, Something):
return 'CustomSomethingRepresentation'
return JSONSerializer.default(self, obj)
client = OpenSearch(serializer=SetEncoder())
2020-05-15 09:36:47 -05:00
"""
2020-05-20 12:34:29 -05:00
def __init__(self, hosts=None, transport_class=AsyncTransport, **kwargs):
2020-05-15 09:36:47 -05:00
"""
:arg hosts: list of nodes, or a single node, we should connect to.
Node should be a dictionary ({"host": "localhost", "port": 9200}),
2021-08-13 15:51:50 +05:30
the entire dictionary will be passed to the :class:`~opensearch.Connection`
2020-05-15 09:36:47 -05:00
class as kwargs, or a string in the format of ``host[:port]`` which will be
translated to a dictionary automatically. If no value is given the
2021-08-13 15:51:50 +05:30
:class:`~opensearch.Connection` class defaults will be used.
2020-05-15 09:36:47 -05:00
2021-08-13 15:51:50 +05:30
:arg transport_class: :class:`~opensearch.Transport` subclass to use.
2020-05-15 09:36:47 -05:00
:arg kwargs: any additional arguments will be passed on to the
2021-08-13 15:51:50 +05:30
:class:`~opensearch.Transport` class and, subsequently, to the
:class:`~opensearch.Connection` instances.
2020-05-15 09:36:47 -05:00
"""
self.transport = transport_class(_normalize_hosts(hosts), **kwargs)
# namespaced clients for compatibility with API names
2020-06-23 15:34:31 -05:00
self.cat = CatClient(self)
self.cluster = ClusterClient(self)
self.dangling_indices = DanglingIndicesClient(self)
2020-05-15 09:36:47 -05:00
self.indices = IndicesClient(self)
self.ingest = IngestClient(self)
self.nodes = NodesClient(self)
self.remote = RemoteClient(self)
self.snapshot = SnapshotClient(self)
self.tasks = TasksClient(self)
2021-03-23 15:12:20 -05:00
self.features = FeaturesClient(self)
2020-05-15 09:36:47 -05:00
def __repr__(self):
try:
# get a list of all connections
cons = self.transport.hosts
# truncate to 5 if there are too many
if len(cons) > 5:
cons = cons[:5] + ["..."]
return "<{cls}({cons})>".format(cls=self.__class__.__name__, cons=cons)
except Exception:
# probably operating on custom transport and connection_pool, ignore
2021-08-13 15:51:50 +05:30
return super(AsyncOpenSearch, self).__repr__()
2020-05-20 12:34:29 -05:00
async def __aenter__(self):
if hasattr(self.transport, "_async_call"):
await self.transport._async_call()
return self
async def __aexit__(self, *_):
await self.close()
async def close(self):
2020-05-29 12:27:02 -05:00
"""Closes the Transport and all internal connections"""
2020-05-20 12:34:29 -05:00
await self.transport.close()
2020-05-15 09:36:47 -05:00
# AUTO-GENERATED-API-DEFINITIONS #
@query_params()
2020-05-20 12:34:29 -05:00
async def ping(self, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Returns whether the cluster is running.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
"""
try:
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"HEAD", "/", params=params, headers=headers
)
except TransportError:
return False
@query_params()
2020-05-20 12:34:29 -05:00
async def info(self, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Returns basic information about the cluster.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
"""
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"GET", "/", params=params, headers=headers
)
@query_params(
"pipeline",
"refresh",
"routing",
"timeout",
"version",
"version_type",
"wait_for_active_shards",
)
2020-05-20 12:34:29 -05:00
async def create(self, index, id, body, doc_type=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Creates a new document in the index. Returns a 409 response when a document
with a same ID already exists in the index.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: The name of the index
:arg id: Document ID
:arg body: The document
:arg doc_type: The type of the document
:arg pipeline: The pipeline id to preprocess incoming documents
with
:arg refresh: If `true` then refresh the affected shards to make
this operation visible to search, if `wait_for` then wait for a refresh
to make this operation visible to search, if `false` (the default) then
2020-06-03 10:38:35 -05:00
do nothing with refreshes. Valid choices: true, false, wait_for
2020-05-15 09:36:47 -05:00
:arg routing: Specific routing value
:arg timeout: Explicit operation timeout
:arg version: Explicit version number for concurrency control
2020-06-03 10:38:35 -05:00
:arg version_type: Specific version type Valid choices:
2020-05-15 09:36:47 -05:00
internal, external, external_gte
:arg wait_for_active_shards: Sets the number of shard copies
that must be active before proceeding with the index operation. Defaults
to 1, meaning the primary shard only. Set to `all` for all shard copies,
otherwise set to any non-negative value less than or equal to the total
number of copies for the shard (number of replicas + 1)
"""
for param in (index, id, body):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
if doc_type in SKIP_IN_PATH:
2020-05-21 14:57:59 -05:00
path = _make_path(index, "_create", id)
else:
path = _make_path(index, doc_type, id, "_create")
2020-05-15 09:36:47 -05:00
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-21 14:57:59 -05:00
"PUT", path, params=params, headers=headers, body=body
2020-05-15 09:36:47 -05:00
)
@query_params(
"if_primary_term",
"if_seq_no",
"op_type",
"pipeline",
"refresh",
2020-07-29 15:51:19 -05:00
"require_alias",
2020-05-15 09:36:47 -05:00
"routing",
"timeout",
"version",
"version_type",
"wait_for_active_shards",
)
2020-05-20 12:34:29 -05:00
async def index(
self, index, body, doc_type=None, id=None, params=None, headers=None
):
2020-05-15 09:36:47 -05:00
"""
Creates or updates a document in an index.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: The name of the index
:arg body: The document
2020-05-20 12:34:29 -05:00
:arg doc_type: The type of the document
2020-05-15 09:36:47 -05:00
:arg id: Document ID
:arg if_primary_term: only perform the index operation if the
last operation that has changed the document has the specified primary
term
:arg if_seq_no: only perform the index operation if the last
operation that has changed the document has the specified sequence
number
:arg op_type: Explicit operation type. Defaults to `index` for
requests with an explicit document ID, and to `create`for requests
2020-06-03 10:38:35 -05:00
without an explicit document ID Valid choices: index, create
2020-05-15 09:36:47 -05:00
:arg pipeline: The pipeline id to preprocess incoming documents
with
:arg refresh: If `true` then refresh the affected shards to make
this operation visible to search, if `wait_for` then wait for a refresh
to make this operation visible to search, if `false` (the default) then
2020-06-03 10:38:35 -05:00
do nothing with refreshes. Valid choices: true, false, wait_for
2020-07-29 15:51:19 -05:00
:arg require_alias: When true, requires destination to be an
alias. Default is false
2020-05-15 09:36:47 -05:00
:arg routing: Specific routing value
:arg timeout: Explicit operation timeout
:arg version: Explicit version number for concurrency control
2020-06-03 10:38:35 -05:00
:arg version_type: Specific version type Valid choices:
2020-05-15 09:36:47 -05:00
internal, external, external_gte
:arg wait_for_active_shards: Sets the number of shard copies
that must be active before proceeding with the index operation. Defaults
to 1, meaning the primary shard only. Set to `all` for all shard copies,
otherwise set to any non-negative value less than or equal to the total
number of copies for the shard (number of replicas + 1)
"""
for param in (index, body):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
2020-05-20 12:34:29 -05:00
if doc_type is None:
doc_type = "_doc"
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST" if id in SKIP_IN_PATH else "PUT",
2020-05-20 12:34:29 -05:00
_make_path(index, doc_type, id),
2020-05-15 09:36:47 -05:00
params=params,
headers=headers,
body=body,
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"pipeline",
"refresh",
2020-07-29 15:51:19 -05:00
"require_alias",
2020-05-15 09:36:47 -05:00
"routing",
"timeout",
"wait_for_active_shards",
)
2020-05-20 12:34:29 -05:00
async def bulk(self, body, index=None, doc_type=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Allows to perform multiple index/update/delete operations in a single request.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: The operation definition and data (action-data
pairs), separated by newlines
:arg index: Default index for items which don't provide one
:arg doc_type: Default document type for items which don't
provide one
:arg _source: True or false to return the _source field or not,
or default list of fields to return, can be overridden on each sub-
request
:arg _source_excludes: Default list of fields to exclude from
the returned _source field, can be overridden on each sub-request
:arg _source_includes: Default list of fields to extract and
return from the _source field, can be overridden on each sub-request
:arg pipeline: The pipeline id to preprocess incoming documents
with
:arg refresh: If `true` then refresh the affected shards to make
this operation visible to search, if `wait_for` then wait for a refresh
to make this operation visible to search, if `false` (the default) then
2020-06-03 10:38:35 -05:00
do nothing with refreshes. Valid choices: true, false, wait_for
2020-07-29 15:51:19 -05:00
:arg require_alias: Sets require_alias for all incoming
documents. Defaults to unset (false)
2020-05-15 09:36:47 -05:00
:arg routing: Specific routing value
:arg timeout: Explicit operation timeout
:arg wait_for_active_shards: Sets the number of shard copies
that must be active before proceeding with the bulk operation. Defaults
to 1, meaning the primary shard only. Set to `all` for all shard copies,
otherwise set to any non-negative value less than or equal to the total
number of copies for the shard (number of replicas + 1)
"""
if body in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'body'.")
body = _bulk_body(self.transport.serializer, body)
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
_make_path(index, doc_type, "_bulk"),
params=params,
headers=headers,
body=body,
)
@query_params()
2020-05-20 12:34:29 -05:00
async def clear_scroll(self, body=None, scroll_id=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Explicitly clears the search context for a scroll.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: A comma-separated list of scroll IDs to clear if none
was specified via the scroll_id parameter
:arg scroll_id: A comma-separated list of scroll IDs to clear
"""
if scroll_id in SKIP_IN_PATH and body in SKIP_IN_PATH:
raise ValueError("You need to supply scroll_id or body.")
elif scroll_id and not body:
body = {"scroll_id": [scroll_id]}
elif scroll_id:
params["scroll_id"] = scroll_id
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"DELETE", "/_search/scroll", params=params, headers=headers, body=body
)
@query_params(
"allow_no_indices",
"analyze_wildcard",
"analyzer",
"default_operator",
"df",
"expand_wildcards",
"ignore_throttled",
"ignore_unavailable",
"lenient",
"min_score",
"preference",
"q",
"routing",
"terminate_after",
)
2020-05-20 12:34:29 -05:00
async def count(
self, body=None, index=None, doc_type=None, params=None, headers=None
):
2020-05-15 09:36:47 -05:00
"""
Returns number of documents matching a query.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: A query to restrict the results specified with the
Query DSL (optional)
:arg index: A comma-separated list of indices to restrict the
results
2020-05-20 12:34:29 -05:00
:arg doc_type: A comma-separated list of types to restrict the
results
2020-05-15 09:36:47 -05:00
:arg allow_no_indices: Whether to ignore if a wildcard indices
expression resolves into no concrete indices. (This includes `_all`
string or when no indices have been specified)
:arg analyze_wildcard: Specify whether wildcard and prefix
queries should be analyzed (default: false)
:arg analyzer: The analyzer to use for the query string
:arg default_operator: The default operator for query string
2020-06-03 10:38:35 -05:00
query (AND or OR) Valid choices: AND, OR Default: OR
2020-05-15 09:36:47 -05:00
:arg df: The field to use as default where no field prefix is
given in the query string
:arg expand_wildcards: Whether to expand wildcard expression to
2020-06-03 10:38:35 -05:00
concrete indices that are open, closed or both. Valid choices: open,
closed, hidden, none, all Default: open
2020-05-15 09:36:47 -05:00
:arg ignore_throttled: Whether specified concrete, expanded or
aliased indices should be ignored when throttled
:arg ignore_unavailable: Whether specified concrete indices
should be ignored when unavailable (missing or closed)
:arg lenient: Specify whether format-based query failures (such
as providing text to a numeric field) should be ignored
:arg min_score: Include only documents with a specific `_score`
value in the result
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg q: Query in the Lucene query string syntax
:arg routing: A comma-separated list of specific routing values
:arg terminate_after: The maximum count for each shard, upon
reaching which the query execution will terminate early
"""
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
2020-05-20 12:34:29 -05:00
_make_path(index, doc_type, "_count"),
2020-05-15 09:36:47 -05:00
params=params,
headers=headers,
body=body,
)
@query_params(
"if_primary_term",
"if_seq_no",
"refresh",
"routing",
"timeout",
"version",
"version_type",
"wait_for_active_shards",
)
2020-05-20 12:34:29 -05:00
async def delete(self, index, id, doc_type=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Removes a document from the index.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: The name of the index
:arg id: The document ID
:arg doc_type: The type of the document
:arg if_primary_term: only perform the delete operation if the
last operation that has changed the document has the specified primary
term
:arg if_seq_no: only perform the delete operation if the last
operation that has changed the document has the specified sequence
number
:arg refresh: If `true` then refresh the affected shards to make
this operation visible to search, if `wait_for` then wait for a refresh
to make this operation visible to search, if `false` (the default) then
2020-06-03 10:38:35 -05:00
do nothing with refreshes. Valid choices: true, false, wait_for
2020-05-15 09:36:47 -05:00
:arg routing: Specific routing value
:arg timeout: Explicit operation timeout
:arg version: Explicit version number for concurrency control
2020-06-03 10:38:35 -05:00
:arg version_type: Specific version type Valid choices:
2020-05-20 12:34:29 -05:00
internal, external, external_gte, force
2020-05-15 09:36:47 -05:00
:arg wait_for_active_shards: Sets the number of shard copies
that must be active before proceeding with the delete operation.
Defaults to 1, meaning the primary shard only. Set to `all` for all
shard copies, otherwise set to any non-negative value less than or equal
to the total number of copies for the shard (number of replicas + 1)
"""
for param in (index, id):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
if doc_type in SKIP_IN_PATH:
doc_type = "_doc"
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"DELETE", _make_path(index, doc_type, id), params=params, headers=headers
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"allow_no_indices",
"analyze_wildcard",
"analyzer",
"conflicts",
"default_operator",
"df",
"expand_wildcards",
"from_",
"ignore_unavailable",
"lenient",
"max_docs",
"preference",
"q",
"refresh",
"request_cache",
"requests_per_second",
"routing",
"scroll",
"scroll_size",
"search_timeout",
"search_type",
2020-05-20 12:34:29 -05:00
"size",
2020-05-15 09:36:47 -05:00
"slices",
"sort",
"stats",
"terminate_after",
"timeout",
"version",
"wait_for_active_shards",
"wait_for_completion",
)
2020-05-20 12:34:29 -05:00
async def delete_by_query(
self, index, body, doc_type=None, params=None, headers=None
):
2020-05-15 09:36:47 -05:00
"""
Deletes documents matching the provided query.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: A comma-separated list of index names to search; use
`_all` or empty string to perform the operation on all indices
:arg body: The search definition using the Query DSL
2020-05-20 12:34:29 -05:00
:arg doc_type: A comma-separated list of document types to
search; leave empty to perform the operation on all types
2020-05-15 09:36:47 -05:00
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg allow_no_indices: Whether to ignore if a wildcard indices
expression resolves into no concrete indices. (This includes `_all`
string or when no indices have been specified)
:arg analyze_wildcard: Specify whether wildcard and prefix
queries should be analyzed (default: false)
:arg analyzer: The analyzer to use for the query string
:arg conflicts: What to do when the delete by query hits version
2020-06-03 10:38:35 -05:00
conflicts? Valid choices: abort, proceed Default: abort
2020-05-15 09:36:47 -05:00
:arg default_operator: The default operator for query string
2020-06-03 10:38:35 -05:00
query (AND or OR) Valid choices: AND, OR Default: OR
2020-05-15 09:36:47 -05:00
:arg df: The field to use as default where no field prefix is
given in the query string
:arg expand_wildcards: Whether to expand wildcard expression to
2020-06-03 10:38:35 -05:00
concrete indices that are open, closed or both. Valid choices: open,
closed, hidden, none, all Default: open
2020-05-20 12:34:29 -05:00
:arg from_: Starting offset (default: 0)
2020-05-15 09:36:47 -05:00
:arg ignore_unavailable: Whether specified concrete indices
should be ignored when unavailable (missing or closed)
:arg lenient: Specify whether format-based query failures (such
as providing text to a numeric field) should be ignored
:arg max_docs: Maximum number of documents to process (default:
all documents)
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg q: Query in the Lucene query string syntax
2020-05-20 12:34:29 -05:00
:arg refresh: Should the effected indexes be refreshed?
2020-05-15 09:36:47 -05:00
:arg request_cache: Specify if request cache should be used for
this request or not, defaults to index level setting
:arg requests_per_second: The throttle for this request in sub-
requests per second. -1 means no throttle.
:arg routing: A comma-separated list of specific routing values
:arg scroll: Specify how long a consistent view of the index
should be maintained for scrolled search
:arg scroll_size: Size on the scroll request powering the delete
2020-06-03 10:38:35 -05:00
by query Default: 100
2020-05-15 09:36:47 -05:00
:arg search_timeout: Explicit timeout for each search request.
Defaults to no timeout.
2020-06-03 10:38:35 -05:00
:arg search_type: Search operation type Valid choices:
2020-05-15 09:36:47 -05:00
query_then_fetch, dfs_query_then_fetch
2020-05-20 12:34:29 -05:00
:arg size: Deprecated, please use `max_docs` instead
2020-05-15 09:36:47 -05:00
:arg slices: The number of slices this task should be divided
into. Defaults to 1, meaning the task isn't sliced into subtasks. Can be
2020-06-03 10:38:35 -05:00
set to `auto`. Default: 1
2020-05-15 09:36:47 -05:00
:arg sort: A comma-separated list of <field>:<direction> pairs
:arg stats: Specific 'tag' of the request for logging and
statistical purposes
:arg terminate_after: The maximum number of documents to collect
for each shard, upon reaching which the query execution will terminate
early.
:arg timeout: Time each individual bulk request should wait for
2020-06-03 10:38:35 -05:00
shards that are unavailable. Default: 1m
2020-05-15 09:36:47 -05:00
:arg version: Specify whether to return document version as part
of a hit
:arg wait_for_active_shards: Sets the number of shard copies
that must be active before proceeding with the delete by query
operation. Defaults to 1, meaning the primary shard only. Set to `all`
for all shard copies, otherwise set to any non-negative value less than
or equal to the total number of copies for the shard (number of replicas
+ 1)
:arg wait_for_completion: Should the request should block until
2020-06-03 10:38:35 -05:00
the delete by query is complete. Default: True
2020-05-15 09:36:47 -05:00
"""
# from is a reserved word so it cannot be used, use from_ instead
if "from_" in params:
params["from"] = params.pop("from_")
for param in (index, body):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
2020-05-20 12:34:29 -05:00
_make_path(index, doc_type, "_delete_by_query"),
2020-05-15 09:36:47 -05:00
params=params,
headers=headers,
body=body,
)
@query_params("requests_per_second")
2020-05-20 12:34:29 -05:00
async def delete_by_query_rethrottle(self, task_id, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Changes the number of requests per second for a particular Delete By Query
operation.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg task_id: The task id to rethrottle
:arg requests_per_second: The throttle to set on this request in
floating sub-requests per second. -1 means set no throttle.
"""
if task_id in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'task_id'.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
_make_path("_delete_by_query", task_id, "_rethrottle"),
params=params,
headers=headers,
)
@query_params("master_timeout", "timeout")
2020-05-20 12:34:29 -05:00
async def delete_script(self, id, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Deletes a script.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg id: Script ID
:arg master_timeout: Specify timeout for connection to master
:arg timeout: Explicit operation timeout
"""
if id in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'id'.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"DELETE", _make_path("_scripts", id), params=params, headers=headers
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"preference",
"realtime",
"refresh",
"routing",
"stored_fields",
"version",
"version_type",
)
2020-05-20 12:34:29 -05:00
async def exists(self, index, id, doc_type=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Returns information about whether a document exists in an index.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: The name of the index
:arg id: The document ID
2020-05-20 12:34:29 -05:00
:arg doc_type: The type of the document (use `_all` to fetch the
first document matching the ID across all types)
2020-05-15 09:36:47 -05:00
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg realtime: Specify whether to perform the operation in
realtime or search mode
:arg refresh: Refresh the shard containing the document before
performing the operation
:arg routing: Specific routing value
:arg stored_fields: A comma-separated list of stored fields to
return in the response
:arg version: Explicit version number for concurrency control
2020-06-03 10:38:35 -05:00
:arg version_type: Specific version type Valid choices:
2020-05-20 12:34:29 -05:00
internal, external, external_gte, force
2020-05-15 09:36:47 -05:00
"""
for param in (index, id):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
2020-05-20 12:34:29 -05:00
if doc_type in SKIP_IN_PATH:
doc_type = "_doc"
return await self.transport.perform_request(
"HEAD", _make_path(index, doc_type, id), params=params, headers=headers
2020-05-15 09:36:47 -05:00
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"preference",
"realtime",
"refresh",
"routing",
"version",
"version_type",
)
2020-05-20 12:34:29 -05:00
async def exists_source(self, index, id, doc_type=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Returns information about whether a document source exists in an index.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: The name of the index
:arg id: The document ID
:arg doc_type: The type of the document; deprecated and optional
starting with 7.0
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg realtime: Specify whether to perform the operation in
realtime or search mode
:arg refresh: Refresh the shard containing the document before
performing the operation
:arg routing: Specific routing value
:arg version: Explicit version number for concurrency control
2020-06-03 10:38:35 -05:00
:arg version_type: Specific version type Valid choices:
2020-05-20 12:34:29 -05:00
internal, external, external_gte, force
2020-05-15 09:36:47 -05:00
"""
for param in (index, id):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
2020-06-03 10:38:35 -05:00
if doc_type in SKIP_IN_PATH:
path = _make_path(index, "_source", id)
else:
path = _make_path(index, doc_type, id, "_source")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-06-03 10:38:35 -05:00
"HEAD", path, params=params, headers=headers
2020-05-15 09:36:47 -05:00
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"analyze_wildcard",
"analyzer",
"default_operator",
"df",
"lenient",
"preference",
"q",
"routing",
"stored_fields",
)
2020-05-20 12:34:29 -05:00
async def explain(
self, index, id, body=None, doc_type=None, params=None, headers=None
):
2020-05-15 09:36:47 -05:00
"""
Returns information about why a specific matches (or doesn't match) a query.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: The name of the index
:arg id: The document ID
:arg body: The query definition using the Query DSL
2020-05-20 12:34:29 -05:00
:arg doc_type: The type of the document
2020-05-15 09:36:47 -05:00
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg analyze_wildcard: Specify whether wildcards and prefix
queries in the query string query should be analyzed (default: false)
:arg analyzer: The analyzer for the query string query
:arg default_operator: The default operator for query string
2020-06-03 10:38:35 -05:00
query (AND or OR) Valid choices: AND, OR Default: OR
2020-05-15 09:36:47 -05:00
:arg df: The default field for query string query (default:
_all)
:arg lenient: Specify whether format-based query failures (such
as providing text to a numeric field) should be ignored
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg q: Query in the Lucene query string syntax
:arg routing: Specific routing value
:arg stored_fields: A comma-separated list of stored fields to
return in the response
"""
for param in (index, id):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
2020-05-20 12:34:29 -05:00
if doc_type in SKIP_IN_PATH:
2020-05-21 14:57:59 -05:00
path = _make_path(index, "_explain", id)
else:
path = _make_path(index, doc_type, id, "_explain")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-21 14:57:59 -05:00
"POST", path, params=params, headers=headers, body=body
2020-05-15 09:36:47 -05:00
)
@query_params(
"allow_no_indices",
"expand_wildcards",
"fields",
"ignore_unavailable",
"include_unmapped",
)
2020-06-23 15:34:31 -05:00
async def field_caps(self, body=None, index=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Returns the information about the capabilities of fields among multiple
indices.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
2020-06-23 15:34:31 -05:00
:arg body: An index filter specified with the Query DSL
2020-05-15 09:36:47 -05:00
:arg index: A comma-separated list of index names; use `_all` or
empty string to perform the operation on all indices
:arg allow_no_indices: Whether to ignore if a wildcard indices
expression resolves into no concrete indices. (This includes `_all`
string or when no indices have been specified)
:arg expand_wildcards: Whether to expand wildcard expression to
2020-06-03 10:38:35 -05:00
concrete indices that are open, closed or both. Valid choices: open,
closed, hidden, none, all Default: open
2020-05-15 09:36:47 -05:00
:arg fields: A comma-separated list of field names
:arg ignore_unavailable: Whether specified concrete indices
should be ignored when unavailable (missing or closed)
:arg include_unmapped: Indicates whether unmapped fields should
be included in the response.
"""
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-06-23 15:34:31 -05:00
"POST",
_make_path(index, "_field_caps"),
params=params,
headers=headers,
body=body,
2020-05-15 09:36:47 -05:00
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"preference",
"realtime",
"refresh",
"routing",
"stored_fields",
"version",
"version_type",
)
2020-05-20 12:34:29 -05:00
async def get(self, index, id, doc_type=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Returns a document.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: The name of the index
:arg id: The document ID
2020-05-20 12:34:29 -05:00
:arg doc_type: The type of the document (use `_all` to fetch the
first document matching the ID across all types)
2020-05-15 09:36:47 -05:00
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg realtime: Specify whether to perform the operation in
realtime or search mode
:arg refresh: Refresh the shard containing the document before
performing the operation
:arg routing: Specific routing value
:arg stored_fields: A comma-separated list of stored fields to
return in the response
:arg version: Explicit version number for concurrency control
2020-06-03 10:38:35 -05:00
:arg version_type: Specific version type Valid choices:
2020-05-20 12:34:29 -05:00
internal, external, external_gte, force
2020-05-15 09:36:47 -05:00
"""
for param in (index, id):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
2020-05-20 12:34:29 -05:00
if doc_type in SKIP_IN_PATH:
doc_type = "_doc"
return await self.transport.perform_request(
"GET", _make_path(index, doc_type, id), params=params, headers=headers
2020-05-15 09:36:47 -05:00
)
@query_params("master_timeout")
2020-05-20 12:34:29 -05:00
async def get_script(self, id, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Returns a script.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg id: Script ID
:arg master_timeout: Specify timeout for connection to master
"""
if id in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'id'.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"GET", _make_path("_scripts", id), params=params, headers=headers
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"preference",
"realtime",
"refresh",
"routing",
"version",
"version_type",
)
2020-05-20 12:34:29 -05:00
async def get_source(self, index, id, doc_type=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Returns the source of a document.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: The name of the index
:arg id: The document ID
2020-05-20 12:34:29 -05:00
:arg doc_type: The type of the document; deprecated and optional
starting with 7.0
2020-05-15 09:36:47 -05:00
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg realtime: Specify whether to perform the operation in
realtime or search mode
:arg refresh: Refresh the shard containing the document before
performing the operation
:arg routing: Specific routing value
:arg version: Explicit version number for concurrency control
2020-06-03 10:38:35 -05:00
:arg version_type: Specific version type Valid choices:
2020-05-20 12:34:29 -05:00
internal, external, external_gte, force
2020-05-15 09:36:47 -05:00
"""
for param in (index, id):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
2020-05-20 12:34:29 -05:00
if doc_type in SKIP_IN_PATH:
2020-05-21 14:57:59 -05:00
path = _make_path(index, "_source", id)
else:
path = _make_path(index, doc_type, id, "_source")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-21 14:57:59 -05:00
"GET", path, params=params, headers=headers
2020-05-15 09:36:47 -05:00
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"preference",
"realtime",
"refresh",
"routing",
"stored_fields",
)
2020-05-20 12:34:29 -05:00
async def mget(self, body, index=None, doc_type=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Allows to get multiple documents in one request.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: Document identifiers; can be either `docs`
2020-05-20 12:34:29 -05:00
(containing full document information) or `ids` (when index and type is
provided in the URL.
2020-05-15 09:36:47 -05:00
:arg index: The name of the index
2020-05-20 12:34:29 -05:00
:arg doc_type: The type of the document
2020-05-15 09:36:47 -05:00
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg realtime: Specify whether to perform the operation in
realtime or search mode
:arg refresh: Refresh the shard containing the document before
performing the operation
:arg routing: Specific routing value
:arg stored_fields: A comma-separated list of stored fields to
return in the response
"""
if body in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'body'.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
2020-05-20 12:34:29 -05:00
_make_path(index, doc_type, "_mget"),
2020-05-15 09:36:47 -05:00
params=params,
headers=headers,
body=body,
)
@query_params(
"ccs_minimize_roundtrips",
"max_concurrent_searches",
"max_concurrent_shard_requests",
"pre_filter_shard_size",
"rest_total_hits_as_int",
"search_type",
"typed_keys",
)
2020-05-20 12:34:29 -05:00
async def msearch(self, body, index=None, doc_type=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Allows to execute several search operations in one request.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: The request definitions (metadata-search request
definition pairs), separated by newlines
:arg index: A comma-separated list of index names to use as
default
2020-05-20 12:34:29 -05:00
:arg doc_type: A comma-separated list of document types to use
as default
2020-05-15 09:36:47 -05:00
:arg ccs_minimize_roundtrips: Indicates whether network round-
trips should be minimized as part of cross-cluster search requests
2020-06-03 10:38:35 -05:00
execution Default: true
2020-05-15 09:36:47 -05:00
:arg max_concurrent_searches: Controls the maximum number of
concurrent searches the multi search api will execute
:arg max_concurrent_shard_requests: The number of concurrent
shard requests each sub search executes concurrently per node. This
value should be used to limit the impact of the search on the cluster in
2020-06-03 10:38:35 -05:00
order to limit the number of concurrent shard requests Default: 5
2020-05-15 09:36:47 -05:00
:arg pre_filter_shard_size: A threshold that enforces a pre-
filter roundtrip to prefilter search shards based on query rewriting if
the number of shards the search request expands to exceeds the
threshold. This filter roundtrip can limit the number of shards
significantly if for instance a shard can not match any documents based
on its rewrite method ie. if date filters are mandatory to match but the
shard bounds and the query are disjoint.
:arg rest_total_hits_as_int: Indicates whether hits.total should
be rendered as an integer or an object in the rest search response
2020-06-03 10:38:35 -05:00
:arg search_type: Search operation type Valid choices:
2021-05-03 10:30:13 -05:00
query_then_fetch, dfs_query_then_fetch
2020-05-15 09:36:47 -05:00
:arg typed_keys: Specify whether aggregation and suggester names
should be prefixed by their respective types in the response
"""
if body in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'body'.")
body = _bulk_body(self.transport.serializer, body)
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
2020-05-20 12:34:29 -05:00
_make_path(index, doc_type, "_msearch"),
params=params,
headers=headers,
body=body,
)
@query_params(
"ccs_minimize_roundtrips",
"max_concurrent_searches",
"rest_total_hits_as_int",
"search_type",
"typed_keys",
)
async def msearch_template(
self, body, index=None, doc_type=None, params=None, headers=None
):
"""
Allows to execute several search template operations in one request.
2020-10-20 13:02:15 -05:00
2020-05-20 12:34:29 -05:00
:arg body: The request definitions (metadata-search request
definition pairs), separated by newlines
:arg index: A comma-separated list of index names to use as
default
:arg doc_type: A comma-separated list of document types to use
as default
:arg ccs_minimize_roundtrips: Indicates whether network round-
trips should be minimized as part of cross-cluster search requests
2020-06-03 10:38:35 -05:00
execution Default: true
2020-05-20 12:34:29 -05:00
:arg max_concurrent_searches: Controls the maximum number of
concurrent searches the multi search api will execute
:arg rest_total_hits_as_int: Indicates whether hits.total should
be rendered as an integer or an object in the rest search response
2020-06-03 10:38:35 -05:00
:arg search_type: Search operation type Valid choices:
2021-05-03 10:30:13 -05:00
query_then_fetch, dfs_query_then_fetch
2020-05-20 12:34:29 -05:00
:arg typed_keys: Specify whether aggregation and suggester names
should be prefixed by their respective types in the response
"""
if body in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'body'.")
body = _bulk_body(self.transport.serializer, body)
return await self.transport.perform_request(
"POST",
_make_path(index, doc_type, "_msearch", "template"),
params=params,
headers=headers,
body=body,
)
@query_params(
"field_statistics",
"fields",
"ids",
"offsets",
"payloads",
"positions",
"preference",
"realtime",
"routing",
"term_statistics",
"version",
"version_type",
)
async def mtermvectors(
self, body=None, index=None, doc_type=None, params=None, headers=None
):
"""
Returns multiple termvectors in one request.
2020-10-20 13:02:15 -05:00
2020-05-20 12:34:29 -05:00
:arg body: Define ids, documents, parameters or a list of
parameters per document here. You must at least provide a list of
document ids. See documentation.
:arg index: The index in which the document resides.
:arg doc_type: The type of the document.
:arg field_statistics: Specifies if document count, sum of
document frequencies and sum of total term frequencies should be
returned. Applies to all returned documents unless otherwise specified
2020-06-03 10:38:35 -05:00
in body "params" or "docs". Default: True
2020-05-20 12:34:29 -05:00
:arg fields: A comma-separated list of fields to return. Applies
to all returned documents unless otherwise specified in body "params" or
"docs".
:arg ids: A comma-separated list of documents ids. You must
define ids as parameter or set "ids" or "docs" in the request body
:arg offsets: Specifies if term offsets should be returned.
Applies to all returned documents unless otherwise specified in body
2020-06-03 10:38:35 -05:00
"params" or "docs". Default: True
2020-05-20 12:34:29 -05:00
:arg payloads: Specifies if term payloads should be returned.
Applies to all returned documents unless otherwise specified in body
2020-06-03 10:38:35 -05:00
"params" or "docs". Default: True
2020-05-20 12:34:29 -05:00
:arg positions: Specifies if term positions should be returned.
Applies to all returned documents unless otherwise specified in body
2020-06-03 10:38:35 -05:00
"params" or "docs". Default: True
2020-05-20 12:34:29 -05:00
:arg preference: Specify the node or shard the operation should
be performed on (default: random) .Applies to all returned documents
unless otherwise specified in body "params" or "docs".
:arg realtime: Specifies if requests are real-time as opposed to
near-real-time (default: true).
:arg routing: Specific routing value. Applies to all returned
documents unless otherwise specified in body "params" or "docs".
:arg term_statistics: Specifies if total term frequency and
document frequency should be returned. Applies to all returned documents
unless otherwise specified in body "params" or "docs".
:arg version: Explicit version number for concurrency control
2020-06-03 10:38:35 -05:00
:arg version_type: Specific version type Valid choices:
2020-05-20 12:34:29 -05:00
internal, external, external_gte, force
"""
2020-05-21 14:57:59 -05:00
if doc_type in SKIP_IN_PATH:
path = _make_path(index, "_mtermvectors")
else:
path = _make_path(index, doc_type, "_mtermvectors")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-21 14:57:59 -05:00
"POST", path, params=params, headers=headers, body=body
2020-05-15 09:36:47 -05:00
)
@query_params("master_timeout", "timeout")
2020-05-20 12:34:29 -05:00
async def put_script(self, id, body, context=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Creates or updates a script.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg id: Script ID
:arg body: The document
:arg context: Context name to compile script against
:arg master_timeout: Specify timeout for connection to master
:arg timeout: Explicit operation timeout
"""
for param in (id, body):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"PUT",
_make_path("_scripts", id, context),
params=params,
headers=headers,
body=body,
)
@query_params(
"allow_no_indices", "expand_wildcards", "ignore_unavailable", "search_type"
)
2020-05-20 12:34:29 -05:00
async def rank_eval(self, body, index=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Allows to evaluate the quality of ranked search results over a set of typical
search queries
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
.. warning::
This API is **experimental** so may include breaking changes
or be removed in a future version
2020-05-15 09:36:47 -05:00
:arg body: The ranking evaluation search definition, including
search requests, document ratings and ranking metric definition.
:arg index: A comma-separated list of index names to search; use
`_all` or empty string to perform the operation on all indices
:arg allow_no_indices: Whether to ignore if a wildcard indices
expression resolves into no concrete indices. (This includes `_all`
string or when no indices have been specified)
:arg expand_wildcards: Whether to expand wildcard expression to
2020-06-03 10:38:35 -05:00
concrete indices that are open, closed or both. Valid choices: open,
closed, hidden, none, all Default: open
2020-05-15 09:36:47 -05:00
:arg ignore_unavailable: Whether specified concrete indices
should be ignored when unavailable (missing or closed)
2020-06-03 10:38:35 -05:00
:arg search_type: Search operation type Valid choices:
2020-05-15 09:36:47 -05:00
query_then_fetch, dfs_query_then_fetch
"""
if body in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'body'.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
_make_path(index, "_rank_eval"),
params=params,
headers=headers,
body=body,
)
@query_params(
"max_docs",
"refresh",
"requests_per_second",
"scroll",
"slices",
"timeout",
"wait_for_active_shards",
"wait_for_completion",
)
2020-05-20 12:34:29 -05:00
async def reindex(self, body, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Allows to copy documents from one index to another, optionally filtering the
source documents by a query, changing the destination index settings, or
fetching the documents from a remote cluster.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: The search definition using the Query DSL and the
prototype for the index request.
:arg max_docs: Maximum number of documents to process (default:
all documents)
:arg refresh: Should the affected indexes be refreshed?
:arg requests_per_second: The throttle to set on this request in
sub-requests per second. -1 means no throttle.
:arg scroll: Control how long to keep the search context alive
Default: 5m
:arg slices: The number of slices this task should be divided
into. Defaults to 1, meaning the task isn't sliced into subtasks. Can be
2020-06-03 10:38:35 -05:00
set to `auto`. Default: 1
2020-05-15 09:36:47 -05:00
:arg timeout: Time each individual bulk request should wait for
2020-06-03 10:38:35 -05:00
shards that are unavailable. Default: 1m
2020-05-15 09:36:47 -05:00
:arg wait_for_active_shards: Sets the number of shard copies
that must be active before proceeding with the reindex operation.
Defaults to 1, meaning the primary shard only. Set to `all` for all
shard copies, otherwise set to any non-negative value less than or equal
to the total number of copies for the shard (number of replicas + 1)
:arg wait_for_completion: Should the request should block until
2020-06-03 10:38:35 -05:00
the reindex is complete. Default: True
2020-05-15 09:36:47 -05:00
"""
if body in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'body'.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST", "/_reindex", params=params, headers=headers, body=body
)
@query_params("requests_per_second")
2020-05-20 12:34:29 -05:00
async def reindex_rethrottle(self, task_id, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Changes the number of requests per second for a particular Reindex operation.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg task_id: The task id to rethrottle
:arg requests_per_second: The throttle to set on this request in
floating sub-requests per second. -1 means set no throttle.
"""
if task_id in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'task_id'.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
_make_path("_reindex", task_id, "_rethrottle"),
params=params,
headers=headers,
)
@query_params()
2020-05-20 12:34:29 -05:00
async def render_search_template(
self, body=None, id=None, params=None, headers=None
):
2020-05-15 09:36:47 -05:00
"""
Allows to use the Mustache language to pre-render a search definition.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: The search definition template and its params
:arg id: The id of the stored search template
"""
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
_make_path("_render", "template", id),
params=params,
headers=headers,
body=body,
)
@query_params()
2020-05-20 12:34:29 -05:00
async def scripts_painless_execute(self, body=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Allows an arbitrary script to be executed and a result to be returned
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
.. warning::
This API is **experimental** so may include breaking changes
or be removed in a future version
2020-05-15 09:36:47 -05:00
:arg body: The script to execute
"""
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
"/_scripts/painless/_execute",
params=params,
headers=headers,
body=body,
)
@query_params("rest_total_hits_as_int", "scroll")
2020-05-20 12:34:29 -05:00
async def scroll(self, body=None, scroll_id=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Allows to retrieve a large numbers of results from a single search request.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: The scroll ID if not passed by URL or query
parameter.
:arg scroll_id: The scroll ID for scrolled search
:arg rest_total_hits_as_int: Indicates whether hits.total should
be rendered as an integer or an object in the rest search response
:arg scroll: Specify how long a consistent view of the index
should be maintained for scrolled search
"""
if scroll_id in SKIP_IN_PATH and body in SKIP_IN_PATH:
raise ValueError("You need to supply scroll_id or body.")
elif scroll_id and not body:
body = {"scroll_id": scroll_id}
elif scroll_id:
params["scroll_id"] = scroll_id
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST", "/_search/scroll", params=params, headers=headers, body=body
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"allow_no_indices",
"allow_partial_search_results",
"analyze_wildcard",
"analyzer",
"batched_reduce_size",
"ccs_minimize_roundtrips",
"default_operator",
"df",
"docvalue_fields",
"expand_wildcards",
"explain",
"from_",
"ignore_throttled",
"ignore_unavailable",
"lenient",
"max_concurrent_shard_requests",
"min_compatible_shard_node",
2020-05-15 09:36:47 -05:00
"pre_filter_shard_size",
"preference",
"q",
"request_cache",
"rest_total_hits_as_int",
"routing",
"scroll",
"search_type",
"seq_no_primary_term",
"size",
"sort",
"stats",
"stored_fields",
"suggest_field",
"suggest_mode",
"suggest_size",
"suggest_text",
"terminate_after",
"timeout",
"track_scores",
"track_total_hits",
"typed_keys",
"version",
)
2020-05-20 12:34:29 -05:00
async def search(
self, body=None, index=None, doc_type=None, params=None, headers=None
):
2020-05-15 09:36:47 -05:00
"""
Returns results matching a query.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: The search definition using the Query DSL
:arg index: A comma-separated list of index names to search; use
`_all` or empty string to perform the operation on all indices
2020-05-20 12:34:29 -05:00
:arg doc_type: A comma-separated list of document types to
search; leave empty to perform the operation on all types
2020-05-15 09:36:47 -05:00
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg allow_no_indices: Whether to ignore if a wildcard indices
expression resolves into no concrete indices. (This includes `_all`
string or when no indices have been specified)
:arg allow_partial_search_results: Indicate if an error should
2020-06-03 10:38:35 -05:00
be returned if there is a partial search failure or timeout Default:
2020-05-15 09:36:47 -05:00
True
:arg analyze_wildcard: Specify whether wildcard and prefix
queries should be analyzed (default: false)
:arg analyzer: The analyzer to use for the query string
:arg batched_reduce_size: The number of shard results that
should be reduced at once on the coordinating node. This value should be
used as a protection mechanism to reduce the memory overhead per search
request if the potential number of shards in the request can be large.
Default: 512
:arg ccs_minimize_roundtrips: Indicates whether network round-
trips should be minimized as part of cross-cluster search requests
2020-06-03 10:38:35 -05:00
execution Default: true
2020-05-15 09:36:47 -05:00
:arg default_operator: The default operator for query string
2020-06-03 10:38:35 -05:00
query (AND or OR) Valid choices: AND, OR Default: OR
2020-05-15 09:36:47 -05:00
:arg df: The field to use as default where no field prefix is
given in the query string
:arg docvalue_fields: A comma-separated list of fields to return
as the docvalue representation of a field for each hit
:arg expand_wildcards: Whether to expand wildcard expression to
2020-06-03 10:38:35 -05:00
concrete indices that are open, closed or both. Valid choices: open,
closed, hidden, none, all Default: open
2020-05-15 09:36:47 -05:00
:arg explain: Specify whether to return detailed information
about score computation as part of a hit
2020-05-20 12:34:29 -05:00
:arg from_: Starting offset (default: 0)
2020-05-15 09:36:47 -05:00
:arg ignore_throttled: Whether specified concrete, expanded or
aliased indices should be ignored when throttled
:arg ignore_unavailable: Whether specified concrete indices
should be ignored when unavailable (missing or closed)
:arg lenient: Specify whether format-based query failures (such
as providing text to a numeric field) should be ignored
:arg max_concurrent_shard_requests: The number of concurrent
shard requests per node this search executes concurrently. This value
should be used to limit the impact of the search on the cluster in order
2020-06-03 10:38:35 -05:00
to limit the number of concurrent shard requests Default: 5
:arg min_compatible_shard_node: The minimum compatible version
that all shards involved in search should have for this request to be
successful
2020-05-15 09:36:47 -05:00
:arg pre_filter_shard_size: A threshold that enforces a pre-
filter roundtrip to prefilter search shards based on query rewriting if
the number of shards the search request expands to exceeds the
threshold. This filter roundtrip can limit the number of shards
significantly if for instance a shard can not match any documents based
on its rewrite method ie. if date filters are mandatory to match but the
shard bounds and the query are disjoint.
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg q: Query in the Lucene query string syntax
:arg request_cache: Specify if request cache should be used for
this request or not, defaults to index level setting
:arg rest_total_hits_as_int: Indicates whether hits.total should
be rendered as an integer or an object in the rest search response
:arg routing: A comma-separated list of specific routing values
:arg scroll: Specify how long a consistent view of the index
should be maintained for scrolled search
2020-06-03 10:38:35 -05:00
:arg search_type: Search operation type Valid choices:
2020-05-15 09:36:47 -05:00
query_then_fetch, dfs_query_then_fetch
:arg seq_no_primary_term: Specify whether to return sequence
number and primary term of the last modification of each hit
:arg size: Number of hits to return (default: 10)
:arg sort: A comma-separated list of <field>:<direction> pairs
:arg stats: Specific 'tag' of the request for logging and
statistical purposes
:arg stored_fields: A comma-separated list of stored fields to
return as part of a hit
:arg suggest_field: Specify which field to use for suggestions
2020-06-03 10:38:35 -05:00
:arg suggest_mode: Specify suggest mode Valid choices: missing,
popular, always Default: missing
2020-05-15 09:36:47 -05:00
:arg suggest_size: How many suggestions to return in response
:arg suggest_text: The source text for which the suggestions
should be returned
:arg terminate_after: The maximum number of documents to collect
for each shard, upon reaching which the query execution will terminate
early.
:arg timeout: Explicit operation timeout
:arg track_scores: Whether to calculate and return scores even
if they are not used for sorting
:arg track_total_hits: Indicate if the number of documents that
match the query should be tracked
:arg typed_keys: Specify whether aggregation and suggester names
should be prefixed by their respective types in the response
:arg version: Specify whether to return document version as part
of a hit
"""
# from is a reserved word so it cannot be used, use from_ instead
if "from_" in params:
params["from"] = params.pop("from_")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
2020-05-20 12:34:29 -05:00
_make_path(index, doc_type, "_search"),
2020-05-15 09:36:47 -05:00
params=params,
headers=headers,
body=body,
)
@query_params(
"allow_no_indices",
"expand_wildcards",
"ignore_unavailable",
"local",
"preference",
"routing",
)
2020-05-20 12:34:29 -05:00
async def search_shards(self, index=None, params=None, headers=None):
2020-05-15 09:36:47 -05:00
"""
Returns information about the indices and shards that a search request would be
executed against.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: A comma-separated list of index names to search; use
`_all` or empty string to perform the operation on all indices
:arg allow_no_indices: Whether to ignore if a wildcard indices
expression resolves into no concrete indices. (This includes `_all`
string or when no indices have been specified)
:arg expand_wildcards: Whether to expand wildcard expression to
2020-06-03 10:38:35 -05:00
concrete indices that are open, closed or both. Valid choices: open,
closed, hidden, none, all Default: open
2020-05-15 09:36:47 -05:00
:arg ignore_unavailable: Whether specified concrete indices
should be ignored when unavailable (missing or closed)
:arg local: Return local information, do not retrieve the state
from master node (default: false)
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg routing: Specific routing value
"""
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"GET", _make_path(index, "_search_shards"), params=params, headers=headers
)
@query_params(
"allow_no_indices",
"ccs_minimize_roundtrips",
"expand_wildcards",
"explain",
"ignore_throttled",
"ignore_unavailable",
"preference",
"profile",
"rest_total_hits_as_int",
"routing",
"scroll",
"search_type",
"typed_keys",
)
2020-05-20 12:34:29 -05:00
async def search_template(
self, body, index=None, doc_type=None, params=None, headers=None
):
2020-05-15 09:36:47 -05:00
"""
Allows to use the Mustache language to pre-render a search definition.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg body: The search definition template and its params
:arg index: A comma-separated list of index names to search; use
`_all` or empty string to perform the operation on all indices
2020-05-20 12:34:29 -05:00
:arg doc_type: A comma-separated list of document types to
search; leave empty to perform the operation on all types
2020-05-15 09:36:47 -05:00
:arg allow_no_indices: Whether to ignore if a wildcard indices
expression resolves into no concrete indices. (This includes `_all`
string or when no indices have been specified)
:arg ccs_minimize_roundtrips: Indicates whether network round-
trips should be minimized as part of cross-cluster search requests
2020-06-03 10:38:35 -05:00
execution Default: true
2020-05-15 09:36:47 -05:00
:arg expand_wildcards: Whether to expand wildcard expression to
2020-06-03 10:38:35 -05:00
concrete indices that are open, closed or both. Valid choices: open,
closed, hidden, none, all Default: open
2020-05-15 09:36:47 -05:00
:arg explain: Specify whether to return detailed information
about score computation as part of a hit
:arg ignore_throttled: Whether specified concrete, expanded or
aliased indices should be ignored when throttled
:arg ignore_unavailable: Whether specified concrete indices
should be ignored when unavailable (missing or closed)
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg profile: Specify whether to profile the query execution
:arg rest_total_hits_as_int: Indicates whether hits.total should
be rendered as an integer or an object in the rest search response
:arg routing: A comma-separated list of specific routing values
:arg scroll: Specify how long a consistent view of the index
should be maintained for scrolled search
2020-06-03 10:38:35 -05:00
:arg search_type: Search operation type Valid choices:
2021-05-03 10:30:13 -05:00
query_then_fetch, dfs_query_then_fetch
2020-05-15 09:36:47 -05:00
:arg typed_keys: Specify whether aggregation and suggester names
should be prefixed by their respective types in the response
"""
if body in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'body'.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
2020-05-20 12:34:29 -05:00
_make_path(index, doc_type, "_search", "template"),
2020-05-15 09:36:47 -05:00
params=params,
headers=headers,
body=body,
)
@query_params(
"field_statistics",
"fields",
"offsets",
"payloads",
"positions",
"preference",
"realtime",
"routing",
"term_statistics",
"version",
"version_type",
)
2020-05-20 12:34:29 -05:00
async def termvectors(
self, index, body=None, doc_type=None, id=None, params=None, headers=None
):
2020-05-15 09:36:47 -05:00
"""
Returns information and statistics about terms in the fields of a particular
document.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: The index in which the document resides.
:arg body: Define parameters and or supply a document to get
termvectors for. See documentation.
2020-05-20 12:34:29 -05:00
:arg doc_type: The type of the document.
2020-05-15 09:36:47 -05:00
:arg id: The id of the document, when not specified a doc param
should be supplied.
:arg field_statistics: Specifies if document count, sum of
document frequencies and sum of total term frequencies should be
2020-06-03 10:38:35 -05:00
returned. Default: True
2020-05-15 09:36:47 -05:00
:arg fields: A comma-separated list of fields to return.
:arg offsets: Specifies if term offsets should be returned.
Default: True
:arg payloads: Specifies if term payloads should be returned.
Default: True
:arg positions: Specifies if term positions should be returned.
Default: True
:arg preference: Specify the node or shard the operation should
be performed on (default: random).
:arg realtime: Specifies if request is real-time as opposed to
near-real-time (default: true).
:arg routing: Specific routing value.
:arg term_statistics: Specifies if total term frequency and
document frequency should be returned.
:arg version: Explicit version number for concurrency control
2020-06-03 10:38:35 -05:00
:arg version_type: Specific version type Valid choices:
2020-05-20 12:34:29 -05:00
internal, external, external_gte, force
2020-05-15 09:36:47 -05:00
"""
if index in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'index'.")
2020-05-20 12:34:29 -05:00
if doc_type in SKIP_IN_PATH:
2020-05-21 14:57:59 -05:00
path = _make_path(index, "_termvectors", id)
else:
path = _make_path(index, doc_type, id, "_termvectors")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-21 14:57:59 -05:00
"POST", path, params=params, headers=headers, body=body
2020-05-20 12:34:29 -05:00
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"if_primary_term",
"if_seq_no",
"lang",
"refresh",
2020-07-29 15:51:19 -05:00
"require_alias",
2020-05-20 12:34:29 -05:00
"retry_on_conflict",
"routing",
"timeout",
"wait_for_active_shards",
)
async def update(self, index, id, body, doc_type=None, params=None, headers=None):
"""
Updates a document with a script or partial document.
2020-10-20 13:02:15 -05:00
2020-05-20 12:34:29 -05:00
:arg index: The name of the index
:arg id: Document ID
:arg body: The request definition requires either `script` or
partial `doc`
:arg doc_type: The type of the document
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg if_primary_term: only perform the update operation if the
last operation that has changed the document has the specified primary
term
:arg if_seq_no: only perform the update operation if the last
operation that has changed the document has the specified sequence
number
:arg lang: The script language (default: painless)
:arg refresh: If `true` then refresh the affected shards to make
this operation visible to search, if `wait_for` then wait for a refresh
to make this operation visible to search, if `false` (the default) then
2020-06-03 10:38:35 -05:00
do nothing with refreshes. Valid choices: true, false, wait_for
2020-07-29 15:51:19 -05:00
:arg require_alias: When true, requires destination is an alias.
Default is false
2020-05-20 12:34:29 -05:00
:arg retry_on_conflict: Specify how many times should the
operation be retried when a conflict occurs (default: 0)
:arg routing: Specific routing value
:arg timeout: Explicit operation timeout
:arg wait_for_active_shards: Sets the number of shard copies
that must be active before proceeding with the update operation.
Defaults to 1, meaning the primary shard only. Set to `all` for all
shard copies, otherwise set to any non-negative value less than or equal
to the total number of copies for the shard (number of replicas + 1)
"""
for param in (index, id, body):
if param in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument.")
if doc_type in SKIP_IN_PATH:
2020-05-21 14:57:59 -05:00
path = _make_path(index, "_update", id)
else:
path = _make_path(index, doc_type, id, "_update")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-21 14:57:59 -05:00
"POST", path, params=params, headers=headers, body=body
2020-05-15 09:36:47 -05:00
)
@query_params(
"_source",
"_source_excludes",
"_source_includes",
"allow_no_indices",
"analyze_wildcard",
"analyzer",
"conflicts",
"default_operator",
"df",
"expand_wildcards",
"from_",
"ignore_unavailable",
"lenient",
"max_docs",
"pipeline",
"preference",
"q",
"refresh",
"request_cache",
"requests_per_second",
"routing",
"scroll",
"scroll_size",
"search_timeout",
"search_type",
2020-05-20 12:34:29 -05:00
"size",
2020-05-15 09:36:47 -05:00
"slices",
"sort",
"stats",
"terminate_after",
"timeout",
"version",
"version_type",
"wait_for_active_shards",
"wait_for_completion",
)
2020-05-20 12:34:29 -05:00
async def update_by_query(
self, index, body=None, doc_type=None, params=None, headers=None
):
2020-05-15 09:36:47 -05:00
"""
Performs an update on every document in the index without changing the source,
for example to pick up a mapping change.
2020-10-20 13:02:15 -05:00
2020-05-15 09:36:47 -05:00
:arg index: A comma-separated list of index names to search; use
`_all` or empty string to perform the operation on all indices
:arg body: The search definition using the Query DSL
2020-05-20 12:34:29 -05:00
:arg doc_type: A comma-separated list of document types to
search; leave empty to perform the operation on all types
2020-05-15 09:36:47 -05:00
:arg _source: True or false to return the _source field or not,
or a list of fields to return
:arg _source_excludes: A list of fields to exclude from the
returned _source field
:arg _source_includes: A list of fields to extract and return
from the _source field
:arg allow_no_indices: Whether to ignore if a wildcard indices
expression resolves into no concrete indices. (This includes `_all`
string or when no indices have been specified)
:arg analyze_wildcard: Specify whether wildcard and prefix
queries should be analyzed (default: false)
:arg analyzer: The analyzer to use for the query string
:arg conflicts: What to do when the update by query hits version
2020-06-03 10:38:35 -05:00
conflicts? Valid choices: abort, proceed Default: abort
2020-05-15 09:36:47 -05:00
:arg default_operator: The default operator for query string
2020-06-03 10:38:35 -05:00
query (AND or OR) Valid choices: AND, OR Default: OR
2020-05-15 09:36:47 -05:00
:arg df: The field to use as default where no field prefix is
given in the query string
:arg expand_wildcards: Whether to expand wildcard expression to
2020-06-03 10:38:35 -05:00
concrete indices that are open, closed or both. Valid choices: open,
closed, hidden, none, all Default: open
2020-05-20 12:34:29 -05:00
:arg from_: Starting offset (default: 0)
2020-05-15 09:36:47 -05:00
:arg ignore_unavailable: Whether specified concrete indices
should be ignored when unavailable (missing or closed)
:arg lenient: Specify whether format-based query failures (such
as providing text to a numeric field) should be ignored
:arg max_docs: Maximum number of documents to process (default:
all documents)
:arg pipeline: Ingest pipeline to set on index requests made by
this action. (default: none)
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg q: Query in the Lucene query string syntax
:arg refresh: Should the affected indexes be refreshed?
:arg request_cache: Specify if request cache should be used for
this request or not, defaults to index level setting
:arg requests_per_second: The throttle to set on this request in
sub-requests per second. -1 means no throttle.
:arg routing: A comma-separated list of specific routing values
:arg scroll: Specify how long a consistent view of the index
should be maintained for scrolled search
:arg scroll_size: Size on the scroll request powering the update
2020-06-03 10:38:35 -05:00
by query Default: 100
2020-05-15 09:36:47 -05:00
:arg search_timeout: Explicit timeout for each search request.
Defaults to no timeout.
2020-06-03 10:38:35 -05:00
:arg search_type: Search operation type Valid choices:
2020-05-15 09:36:47 -05:00
query_then_fetch, dfs_query_then_fetch
2020-05-20 12:34:29 -05:00
:arg size: Deprecated, please use `max_docs` instead
2020-05-15 09:36:47 -05:00
:arg slices: The number of slices this task should be divided
into. Defaults to 1, meaning the task isn't sliced into subtasks. Can be
2020-06-03 10:38:35 -05:00
set to `auto`. Default: 1
2020-05-15 09:36:47 -05:00
:arg sort: A comma-separated list of <field>:<direction> pairs
:arg stats: Specific 'tag' of the request for logging and
statistical purposes
:arg terminate_after: The maximum number of documents to collect
for each shard, upon reaching which the query execution will terminate
early.
:arg timeout: Time each individual bulk request should wait for
2020-06-03 10:38:35 -05:00
shards that are unavailable. Default: 1m
2020-05-15 09:36:47 -05:00
:arg version: Specify whether to return document version as part
of a hit
:arg version_type: Should the document increment the version
number (internal) on hit or not (reindex)
:arg wait_for_active_shards: Sets the number of shard copies
that must be active before proceeding with the update by query
operation. Defaults to 1, meaning the primary shard only. Set to `all`
for all shard copies, otherwise set to any non-negative value less than
or equal to the total number of copies for the shard (number of replicas
+ 1)
:arg wait_for_completion: Should the request should block until
2020-06-03 10:38:35 -05:00
the update by query operation is complete. Default: True
2020-05-15 09:36:47 -05:00
"""
# from is a reserved word so it cannot be used, use from_ instead
if "from_" in params:
params["from"] = params.pop("from_")
if index in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'index'.")
2020-05-20 12:34:29 -05:00
return await self.transport.perform_request(
2020-05-15 09:36:47 -05:00
"POST",
2020-05-20 12:34:29 -05:00
_make_path(index, doc_type, "_update_by_query"),
2020-05-15 09:36:47 -05:00
params=params,
headers=headers,
body=body,
)
2020-05-20 12:34:29 -05:00
@query_params("requests_per_second")
async def update_by_query_rethrottle(self, task_id, params=None, headers=None):
"""
Changes the number of requests per second for a particular Update By Query
operation.
2020-10-20 13:02:15 -05:00
2020-05-20 12:34:29 -05:00
:arg task_id: The task id to rethrottle
:arg requests_per_second: The throttle to set on this request in
floating sub-requests per second. -1 means set no throttle.
"""
if task_id in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'task_id'.")
return await self.transport.perform_request(
"POST",
_make_path("_update_by_query", task_id, "_rethrottle"),
params=params,
headers=headers,
)
@query_params()
async def get_script_context(self, params=None, headers=None):
"""
Returns all script contexts.
2020-10-20 13:02:15 -05:00
.. warning::
This API is **experimental** so may include breaking changes
or be removed in a future version
2020-05-20 12:34:29 -05:00
"""
return await self.transport.perform_request(
"GET", "/_script_context", params=params, headers=headers
)
@query_params()
async def get_script_languages(self, params=None, headers=None):
"""
Returns available script types, languages and contexts
2020-10-20 13:02:15 -05:00
.. warning::
This API is **experimental** so may include breaking changes
or be removed in a future version
2020-05-20 12:34:29 -05:00
"""
return await self.transport.perform_request(
"GET", "/_script_language", params=params, headers=headers
)
2020-08-31 11:07:40 -05:00
@query_params()
async def close_point_in_time(self, body=None, params=None, headers=None):
"""
Close a point in time
2020-10-20 13:02:15 -05:00
2020-08-31 11:07:40 -05:00
:arg body: a point-in-time id to close
"""
return await self.transport.perform_request(
"DELETE", "/_pit", params=params, headers=headers, body=body
)
@query_params(
"expand_wildcards", "ignore_unavailable", "keep_alive", "preference", "routing"
)
async def open_point_in_time(self, index=None, params=None, headers=None):
"""
Open a point in time that can be used in subsequent searches
2020-10-20 13:02:15 -05:00
2020-08-31 11:07:40 -05:00
:arg index: A comma-separated list of index names to open point
in time; use `_all` or empty string to perform the operation on all
indices
:arg expand_wildcards: Whether to expand wildcard expression to
concrete indices that are open, closed or both. Valid choices: open,
closed, hidden, none, all Default: open
:arg ignore_unavailable: Whether specified concrete indices
should be ignored when unavailable (missing or closed)
:arg keep_alive: Specific the time to live for the point in time
:arg preference: Specify the node or shard the operation should
be performed on (default: random)
:arg routing: Specific routing value
"""
return await self.transport.perform_request(
"POST", _make_path(index, "_pit"), params=params, headers=headers
)
2021-06-04 10:17:58 -05:00
@query_params()
async def terms_enum(self, index, body=None, params=None, headers=None):
"""
The terms enum API can be used to discover terms in the index that begin with
the provided string. It is designed for low-latency look-ups used in auto-
complete scenarios.
.. warning::
This API is **beta** so may include breaking changes
or be removed in a future version
:arg index: A comma-separated list of index names to search; use
`_all` or empty string to perform the operation on all indices
:arg body: field name, string which is the prefix expected in
matching terms, timeout and size for max number of results
"""
if index in SKIP_IN_PATH:
raise ValueError("Empty value passed for a required argument 'index'.")
return await self.transport.perform_request(
"POST",
_make_path(index, "_terms_enum"),
params=params,
headers=headers,
body=body,
)