dcb79cc322
* Merged types into .py code. Signed-off-by: dblock <dblock@amazon.com> * Fix: nox -rs generate. Signed-off-by: dblock <dblock@amazon.com> * Updated CHANGELOG. Signed-off-by: dblock <dblock@amazon.com> * Use lowest common python version for lint. Signed-off-by: dblock <dblock@amazon.com> * Fix: don't typeshed. Signed-off-by: dblock <dblock@amazon.com> * Removed unneeded comment. Signed-off-by: dblock <dblock@amazon.com> * Simplify OPENSEARCH_URL. Signed-off-by: dblock <dblock@amazon.com> * Fix: positional ignore_status used as chunk_size. Signed-off-by: dblock <dblock@amazon.com> * Fix: parse version string. Signed-off-by: dblock <dblock@amazon.com> * Remove future annotations for Python 3.6. Signed-off-by: dblock <dblock@amazon.com> * Fix: types in documentation. Signed-off-by: dblock <dblock@amazon.com> * Improve CHANGELOG text. Signed-off-by: dblock <dblock@amazon.com> * Re-added missing separator. Signed-off-by: dblock <dblock@amazon.com> * Remove duplicate licenses. Signed-off-by: dblock <dblock@amazon.com> * Get rid of Optional[Any]. Signed-off-by: dblock <dblock@amazon.com> * Fix docs with AsyncOpenSearch. Signed-off-by: dblock <dblock@amazon.com> * Fix: undo comment. Signed-off-by: dblock <dblock@amazon.com> --------- Signed-off-by: dblock <dblock@amazon.com>
171 lines
5.6 KiB
Python
171 lines
5.6 KiB
Python
# -*- coding: utf-8 -*-
|
|
# SPDX-License-Identifier: Apache-2.0
|
|
#
|
|
# The OpenSearch Contributors require contributions made to
|
|
# this file be licensed under the Apache-2.0 license or a
|
|
# compatible open source license.
|
|
#
|
|
# Modifications Copyright OpenSearch Contributors. See
|
|
# GitHub history for details.
|
|
|
|
import collections.abc as collections_abc
|
|
from itertools import chain
|
|
from typing import Any
|
|
|
|
from six import iteritems
|
|
|
|
from opensearchpy.connection.async_connections import get_connection
|
|
from opensearchpy.helpers.field import Nested, Text
|
|
from opensearchpy.helpers.mapping import META_FIELDS, Properties
|
|
|
|
|
|
class AsyncMapping(object):
|
|
_meta: Any
|
|
properties: Properties
|
|
|
|
def __init__(self) -> None:
|
|
self.properties = Properties()
|
|
self._meta = {}
|
|
|
|
def __repr__(self) -> str:
|
|
return "Mapping()"
|
|
|
|
def _clone(self) -> Any:
|
|
m = AsyncMapping()
|
|
m.properties._params = self.properties._params.copy()
|
|
return m
|
|
|
|
@classmethod
|
|
async def from_opensearch(cls, index: Any, using: str = "default") -> Any:
|
|
m = cls()
|
|
await m.update_from_opensearch(index, using)
|
|
return m
|
|
|
|
def resolve_nested(self, field_path: str) -> Any:
|
|
field = self
|
|
nested = []
|
|
parts = field_path.split(".")
|
|
for i, step in enumerate(parts):
|
|
try:
|
|
field = field[step]
|
|
except KeyError:
|
|
return (), None
|
|
if isinstance(field, Nested):
|
|
nested.append(".".join(parts[: i + 1]))
|
|
return nested, field
|
|
|
|
def resolve_field(self, field_path: Any) -> Any:
|
|
field = self
|
|
for step in field_path.split("."):
|
|
try:
|
|
field = field[step]
|
|
except KeyError:
|
|
return None
|
|
return field
|
|
|
|
def _collect_analysis(self) -> Any:
|
|
analysis: Any = {}
|
|
fields: Any = []
|
|
if "_all" in self._meta:
|
|
fields.append(Text(**self._meta["_all"]))
|
|
|
|
for f in chain(fields, self.properties._collect_fields()):
|
|
for analyzer_name in (
|
|
"analyzer",
|
|
"normalizer",
|
|
"search_analyzer",
|
|
"search_quote_analyzer",
|
|
):
|
|
if not hasattr(f, analyzer_name):
|
|
continue
|
|
analyzer = getattr(f, analyzer_name)
|
|
d = analyzer.get_analysis_definition()
|
|
# empty custom analyzer, probably already defined out of our control
|
|
if not d:
|
|
continue
|
|
|
|
# merge the definition
|
|
# TODO: conflict detection/resolution
|
|
for key in d:
|
|
analysis.setdefault(key, {}).update(d[key])
|
|
|
|
return analysis
|
|
|
|
async def save(self, index: Any, using: str = "default") -> Any:
|
|
from opensearchpy._async.helpers.index import AsyncIndex
|
|
|
|
index = AsyncIndex(index, using=using)
|
|
index.mapping(self)
|
|
return await index.save()
|
|
|
|
async def update_from_opensearch(self, index: Any, using: str = "default") -> None:
|
|
opensearch = await get_connection(using)
|
|
raw = await opensearch.indices.get_mapping(index=index)
|
|
_, raw = raw.popitem()
|
|
self._update_from_dict(raw["mappings"])
|
|
|
|
def _update_from_dict(self, raw: Any) -> None:
|
|
for name, definition in iteritems(raw.get("properties", {})):
|
|
self.field(name, definition)
|
|
|
|
# metadata like _all etc
|
|
for name, value in iteritems(raw):
|
|
if name != "properties":
|
|
if isinstance(value, collections_abc.Mapping):
|
|
self.meta(name, **value)
|
|
else:
|
|
self.meta(name, value)
|
|
|
|
def update(self, mapping: Any, update_only: bool = False) -> None:
|
|
for name in mapping:
|
|
if update_only and name in self:
|
|
# nested and inner objects, merge recursively
|
|
if hasattr(self[name], "update"):
|
|
# FIXME only merge subfields, not the settings
|
|
self[name].update(mapping[name], update_only)
|
|
continue
|
|
self.field(name, mapping[name])
|
|
|
|
if update_only:
|
|
for name in mapping._meta:
|
|
if name not in self._meta:
|
|
self._meta[name] = mapping._meta[name]
|
|
else:
|
|
self._meta.update(mapping._meta)
|
|
|
|
def __contains__(self, name: Any) -> bool:
|
|
return name in self.properties.properties
|
|
|
|
def __getitem__(self, name: Any) -> Any:
|
|
return self.properties.properties[name]
|
|
|
|
def __iter__(self) -> Any:
|
|
return iter(self.properties.properties)
|
|
|
|
def field(self, *args: Any, **kwargs: Any) -> "AsyncMapping":
|
|
self.properties.field(*args, **kwargs)
|
|
return self
|
|
|
|
def meta(self, name: Any, params: Any = None, **kwargs: Any) -> "AsyncMapping":
|
|
if not name.startswith("_") and name not in META_FIELDS:
|
|
name = "_" + name
|
|
|
|
if params and kwargs:
|
|
raise ValueError("Meta configs cannot have both value and a dictionary.")
|
|
|
|
self._meta[name] = kwargs if params is None else params
|
|
return self
|
|
|
|
def to_dict(self) -> Any:
|
|
meta = self._meta
|
|
|
|
# hard coded serialization of analyzers in _all
|
|
if "_all" in meta:
|
|
meta = meta.copy()
|
|
_all = meta["_all"] = meta["_all"].copy()
|
|
for f in ("analyzer", "search_analyzer", "search_quote_analyzer"):
|
|
if hasattr(_all.get(f, None), "to_dict"):
|
|
_all[f] = _all[f].to_dict()
|
|
meta.update(self.properties.to_dict())
|
|
return meta
|