6e3f1a1194
* Upgrade syntax with pyupgrade --py38-plus Signed-off-by: Hugo van Kemenade <1324225+hugovk@users.noreply.github.com> * Convert to f-strings with flynt Signed-off-by: Hugo van Kemenade <1324225+hugovk@users.noreply.github.com> * Format with Black Signed-off-by: Hugo van Kemenade <1324225+hugovk@users.noreply.github.com> * Remove redundant mock backport dependency Signed-off-by: Hugo van Kemenade <1324225+hugovk@users.noreply.github.com> * isort imports Signed-off-by: Hugo van Kemenade <1324225+hugovk@users.noreply.github.com> * Add changelog entry Signed-off-by: Hugo van Kemenade <1324225+hugovk@users.noreply.github.com> --------- Signed-off-by: Hugo van Kemenade <1324225+hugovk@users.noreply.github.com>
215 lines
6.3 KiB
Python
215 lines
6.3 KiB
Python
# SPDX-License-Identifier: Apache-2.0
|
|
#
|
|
# The OpenSearch Contributors require contributions made to
|
|
# this file be licensed under the Apache-2.0 license or a
|
|
# compatible open source license.
|
|
#
|
|
# Modifications Copyright OpenSearch Contributors. See
|
|
# GitHub history for details.
|
|
#
|
|
# Licensed to Elasticsearch B.V. under one or more contributor
|
|
# license agreements. See the NOTICE file distributed with
|
|
# this work for additional information regarding copyright
|
|
# ownership. Elasticsearch B.V. licenses this file to you under
|
|
# the Apache License, Version 2.0 (the "License"); you may
|
|
# not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing,
|
|
# software distributed under the License is distributed on an
|
|
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
# KIND, either express or implied. See the License for the
|
|
# specific language governing permissions and limitations
|
|
# under the License.
|
|
|
|
|
|
from typing import Any, Dict, Optional
|
|
|
|
try:
|
|
import simplejson as json
|
|
except ImportError:
|
|
import json # type: ignore
|
|
|
|
import uuid
|
|
from datetime import date, datetime
|
|
from decimal import Decimal
|
|
|
|
from .compat import string_types
|
|
from .exceptions import ImproperlyConfigured, SerializationError
|
|
from .helpers.utils import AttrList
|
|
|
|
INTEGER_TYPES = ()
|
|
FLOAT_TYPES = (Decimal,)
|
|
TIME_TYPES = (date, datetime)
|
|
|
|
|
|
class Serializer:
|
|
mimetype: str = ""
|
|
|
|
def loads(self, s: str) -> Any:
|
|
raise NotImplementedError()
|
|
|
|
def dumps(self, data: Any) -> Any:
|
|
raise NotImplementedError()
|
|
|
|
|
|
class TextSerializer(Serializer):
|
|
mimetype: str = "text/plain"
|
|
|
|
def loads(self, s: str) -> Any:
|
|
return s
|
|
|
|
def dumps(self, data: Any) -> Any:
|
|
if isinstance(data, string_types):
|
|
return data
|
|
|
|
raise SerializationError(f"Cannot serialize {data!r} into text.")
|
|
|
|
|
|
class JSONSerializer(Serializer):
|
|
mimetype: str = "application/json"
|
|
|
|
def default(self, data: Any) -> Any:
|
|
if isinstance(data, TIME_TYPES):
|
|
# Little hack to avoid importing pandas but to not
|
|
# return 'NaT' string for pd.NaT as that's not a valid
|
|
# date.
|
|
formatted_data = data.isoformat()
|
|
if formatted_data != "NaT":
|
|
return formatted_data
|
|
|
|
if isinstance(data, uuid.UUID):
|
|
return str(data)
|
|
elif isinstance(data, FLOAT_TYPES):
|
|
return float(data)
|
|
elif INTEGER_TYPES and isinstance(data, INTEGER_TYPES):
|
|
return int(data)
|
|
|
|
# Special cases for numpy and pandas types
|
|
# These are expensive to import so we try them last.
|
|
try:
|
|
import numpy as np
|
|
|
|
if isinstance(
|
|
data,
|
|
(
|
|
np.int_,
|
|
np.intc,
|
|
np.int8,
|
|
np.int16,
|
|
np.int32,
|
|
np.int64,
|
|
np.uint8,
|
|
np.uint16,
|
|
np.uint32,
|
|
np.uint64,
|
|
),
|
|
):
|
|
return int(data)
|
|
elif isinstance(
|
|
data,
|
|
(
|
|
np.float16,
|
|
np.float32,
|
|
np.float64,
|
|
),
|
|
):
|
|
return float(data)
|
|
elif isinstance(data, np.bool_):
|
|
return bool(data)
|
|
elif isinstance(data, np.datetime64):
|
|
return data.item().isoformat()
|
|
elif isinstance(data, np.ndarray):
|
|
return data.tolist()
|
|
except ImportError:
|
|
pass
|
|
|
|
try:
|
|
import pandas as pd
|
|
|
|
if isinstance(data, (pd.Series, pd.Categorical)):
|
|
return data.tolist()
|
|
elif isinstance(data, pd.Timestamp) and data is not getattr(
|
|
pd, "NaT", None
|
|
):
|
|
return data.isoformat()
|
|
elif data is getattr(pd, "NA", None):
|
|
return None
|
|
except ImportError:
|
|
pass
|
|
|
|
raise TypeError(f"Unable to serialize {data!r} (type: {type(data)})")
|
|
|
|
def loads(self, s: str) -> Any:
|
|
try:
|
|
return json.loads(s)
|
|
except (ValueError, TypeError) as e:
|
|
raise SerializationError(s, e)
|
|
|
|
def dumps(self, data: Any) -> Any:
|
|
# don't serialize strings
|
|
if isinstance(data, string_types):
|
|
return data
|
|
|
|
try:
|
|
return json.dumps(
|
|
data, default=self.default, ensure_ascii=False, separators=(",", ":")
|
|
)
|
|
except (ValueError, TypeError) as e:
|
|
raise SerializationError(data, e)
|
|
|
|
|
|
DEFAULT_SERIALIZERS: Dict[str, Serializer] = {
|
|
JSONSerializer.mimetype: JSONSerializer(),
|
|
TextSerializer.mimetype: TextSerializer(),
|
|
}
|
|
|
|
|
|
class Deserializer:
|
|
def __init__(
|
|
self,
|
|
serializers: Dict[str, Serializer],
|
|
default_mimetype: str = "application/json",
|
|
) -> None:
|
|
try:
|
|
self.default = serializers[default_mimetype]
|
|
except KeyError:
|
|
raise ImproperlyConfigured(
|
|
f"Cannot find default serializer ({default_mimetype})"
|
|
)
|
|
self.serializers = serializers
|
|
|
|
def loads(self, s: str, mimetype: Optional[str] = None) -> Any:
|
|
if not mimetype:
|
|
deserializer = self.default
|
|
else:
|
|
# Treat 'application/vnd.elasticsearch+json'
|
|
# as application/json for compatibility.
|
|
if mimetype == "application/vnd.elasticsearch+json":
|
|
mimetype = "application/json"
|
|
|
|
# split out charset
|
|
mimetype, _, _ = mimetype.partition(";")
|
|
try:
|
|
deserializer = self.serializers[mimetype]
|
|
except KeyError:
|
|
raise SerializationError(
|
|
f"Unknown mimetype, unable to deserialize: {mimetype}"
|
|
)
|
|
|
|
return deserializer.loads(s)
|
|
|
|
|
|
class AttrJSONSerializer(JSONSerializer):
|
|
def default(self, data: Any) -> Any:
|
|
if isinstance(data, AttrList):
|
|
return data._l_
|
|
if hasattr(data, "to_dict"):
|
|
return data.to_dict()
|
|
return super().default(data)
|
|
|
|
|
|
serializer = AttrJSONSerializer()
|