Files
opensearch-orm/opensearchorm/query.py
2022-09-21 22:05:04 +08:00

175 lines
4.3 KiB
Python

import abc
from enum import Enum
import logging
from typing import List, Optional, Type, TypeVar, Union
from opensearchorm.model import BaseModel
Model = TypeVar('Model', bound=BaseModel)
class Expr(abc.ABC):
@abc.abstractmethod
def compile(self) -> dict:
...
class Contains(Expr):
def __init__(self, field: str, values: list):
self.field = field
self.values = values
def compile(self):
return {
'bool': {
'should': [MatchPhrase(self.field, v).compile() for v in self.values],
'minimum_should_match': 1,
}
}
class Range(Expr):
def __init__(self, field: str, value: Union[str, int], operator: str):
self.field = field
self.op = operator
self.value = value
def compile(self):
return {
'range': {
self.field: {
self.op: self.value,
}
}
}
class MatchPhrase(Expr):
def __init__(self, field: str, value: str):
self.field = field
self.value = value
def compile(self):
return {
'match_phrase': {
self.field: self.value,
}
}
class Prefix(Expr):
def __init__(self, field: str, value: str):
self.field = field
self.value = value
def compile(self):
return {
'prefix': {
self.field: self.value,
}
}
class Wildcard(Expr):
def __init__(self, field: str, value: str):
self.field = field
self.value = value
def compile(self):
return {
'wildcard': {
self.field: self.value,
}
}
class RegExp(Expr):
def __init__(self, field: str, value: str):
self.field = field
self.value = value
def compile(self):
return {
'regexp': {
self.field: self.value,
}
}
class Operator(Enum):
PREFIX = '__prefix'
REGEXP = '__regexp'
CONTAINS = '__contains'
GTE = '__gte'
GT = '__gt'
LTE = '__lte'
LT = '__lt'
class ModelQuery(Expr):
def __init__(self, model_cls: Type[Model]):
self.__model_cls = model_cls
self.__filter: List[Expr] = []
self.__exclude: List[Expr] = []
self.__union: List[Expr] = []
def compile(self):
return {
'bool': {
'must_not': [e.compile() for e in self.__exclude],
'should': [e.compile() for e in self.__union],
'filter': [e.compile() for e in self.__filter],
}
}
def parse_clause(self, raw_field: str, value) -> Expr:
field = raw_field
for op in Operator:
suffix: str = op.value
if raw_field.endswith(suffix):
field = raw_field.removesuffix(suffix)
logging.debug('parse field: %s, raw: %s', field, raw_field)
if op == Operator.CONTAINS:
return Contains(field, value)
elif op == Operator.PREFIX:
return Prefix(field, value)
elif op == Operator.REGEXP:
return RegExp(field, value)
elif op in (Operator.GTE, Operator.GT, Operator.LTE, Operator.LT):
op = suffix.lstrip('_')
return Range(field, value, op)
model = self.__model_cls
valid_fields = set(model.default_fields())
assert field in valid_fields, f'check field name: {field}'
return MatchPhrase(field, value)
def parse_clauses(self, **kwargs):
clauses = []
for k, v in kwargs.items():
cond = self.parse_clause(k, v)
clauses.append(cond)
return clauses
def filter(self, *args: Expr, **kwargs):
conditions = self.parse_clauses(**kwargs)
self.__filter.extend(args)
self.__filter.extend(conditions)
return self
def union(self, *args: Expr, **kwargs):
conditions = self.parse_clauses(**kwargs)
self.__union.extend(args)
self.__union.extend(conditions)
return self
def exclude(self, *args: Expr, **kwargs):
conditions = self.parse_clauses(**kwargs)
self.__exclude.extend(args)
self.__exclude.extend(conditions)
return self