grung-db/src/grung/types.py

197 lines
5.6 KiB
Python
Raw Normal View History

2025-09-27 15:13:17 -07:00
from __future__ import annotations
2025-09-24 19:51:39 -07:00
from collections import namedtuple
from dataclasses import dataclass, field
2025-09-27 15:13:17 -07:00
from typing import Dict, List
2025-09-24 19:51:39 -07:00
import nanoid
from tinydb import TinyDB, where
2025-09-27 15:13:17 -07:00
from grung.exceptions import PointerReferenceError
2025-09-24 19:51:39 -07:00
2025-09-29 23:10:33 -07:00
# Per-record bookkeeping built in Record.__init__: the table name, a mapping of
# field name -> Field, and a callable returning the BackReference fields whose
# value_type matches a given type.
Metadata = namedtuple("Metadata", ("table", "fields", "backrefs"))
2025-09-24 19:51:39 -07:00
@dataclass
class Field:
    """
    Describes one named field of a Record and how its value is stored.

    Subclasses override the hooks and the (de)serialisation methods below to
    customise behaviour for a particular kind of value.
    """

    name: str
    value_type: type = str
    default: str = None
    unique: bool = False

    def before_insert(self, value: value_type, db: TinyDB, record: Record) -> None:
        """
        Hook called by Record.before_insert for each field; does nothing here.
        """
        return None

    def after_insert(self, db: TinyDB, record: Record) -> None:
        """
        Hook called by Record.after_insert for each field; does nothing here.
        """
        return None

    def serialize(self, value: value_type) -> str:
        """
        Return the string form of ``value``; ``None`` is passed through as ``None``.
        """
        return None if value is None else str(value)

    def deserialize(self, value: value_type, db: TinyDB, recurse: bool = True) -> value_type:
        """
        Return ``value`` unchanged; ``db`` and ``recurse`` are unused by the base field.
        """
        return value
2025-09-27 15:13:17 -07:00
@dataclass
class Integer(Field):
    """
    A field whose value is an integer.
    """

    # The annotation is required: dataclasses only treat annotated class
    # attributes as fields, so a bare ``value_type = int`` would leave the
    # inherited ``str`` default in place on every instance.
    value_type: type = int
    default: int = 0

    def deserialize(self, value: str, db: TinyDB, recurse: bool = True) -> value_type:
        """
        Convert a stored value back to ``int``.

        ``None`` is returned unchanged so that a value serialized as ``None``
        round-trips instead of raising ``TypeError``. ``db`` and ``recurse``
        are unused.
        """
        if value is None:
            return None
        return int(value)
2025-09-27 15:13:17 -07:00
2025-09-24 19:51:39 -07:00
2025-09-27 15:13:17 -07:00
class Record(Dict[str, Field]):
    """
    Base type for a single database record.

    A record is a dict of field values keyed by field name. Field values can
    also be read and written as attributes. ``doc_id`` and ``_metadata`` are
    plain instance attributes and are not stored in the dict.
    """

    def __init__(self, raw_doc: dict = None, doc_id: int = None, **params):
        """
        Build a record from the field defaults, then ``raw_doc``, then ``params``.

        Later sources override earlier ones, so a key present in both
        ``raw_doc`` and ``params`` takes its value from ``params``.
        """
        self.doc_id = doc_id
        fields = self.__class__.fields()
        self._metadata = Metadata(
            table=self.__class__.__name__,
            fields={f.name: f for f in fields},
            backrefs=lambda value_type: (
                f for f in fields if isinstance(f, BackReference) and f.value_type == value_type
            ),
        )
        values = {f.name: f.default for f in fields}
        # ``raw_doc`` defaults to None rather than a shared mutable ``{}``.
        values.update(raw_doc or {})
        values.update(params)
        super().__init__(values)

    @classmethod
    def fields(cls):
        """
        Return the list of Field definitions for this record type.

        The base class defines only ``uid``. __init__ calls this method for
        every new record, so each record gets a freshly generated default uid.
        """
        return [
            # 1% collision rate at ~2M records
            Field("uid", default=nanoid.generate(size=8), unique=True)
        ]

    def serialize(self):
        """
        Serialize every field on the record.

        Returns a new record of the same class, with the same doc_id, whose
        values are the results of each field's ``serialize``.
        """
        rec = {name: _field.serialize(self[name]) for name, _field in self._metadata.fields.items()}
        return self.__class__(rec, doc_id=self.doc_id)

    def deserialize(self, db, recurse: bool = True):
        """
        Deserialize every field on the record.

        Returns a new record of the same class, with the same doc_id, whose
        values are the results of each field's ``deserialize``.
        """
        rec = {
            name: _field.deserialize(self[name], db, recurse=recurse)
            for name, _field in self._metadata.fields.items()
        }
        return self.__class__(rec, doc_id=self.doc_id)

    def before_insert(self, db: TinyDB) -> None:
        """
        Call ``before_insert`` on every field with that field's current value.
        """
        for name, _field in self._metadata.fields.items():
            _field.before_insert(self[name], db, self)

    def after_insert(self, db: TinyDB) -> None:
        """
        Call ``after_insert`` on every field.
        """
        for _field in self._metadata.fields.values():
            _field.after_insert(db, self)

    def __setattr__(self, key, value):
        """
        Route attribute assignment for existing keys into the mapping.
        """
        if key in self:
            self[key] = value
            # Do not create an instance attribute for a pure field: it would
            # shadow the mapping and make later attribute reads return a stale
            # value, because __getattr__ only runs when normal lookup fails.
            if key not in self.__dict__:
                return
        super().__setattr__(key, value)

    def __getattr__(self, attr_name):
        """
        Fall back to the mapping when normal attribute lookup fails.

        Raises AttributeError for names that are neither attributes nor keys.
        """
        try:
            return self[attr_name]
        except KeyError:
            raise AttributeError(
                f"{self.__class__.__name__!r} object has no attribute {attr_name!r}"
            ) from None

    def __hash__(self):
        # dict is unhashable, so hash the string form of the stored values.
        # The hash therefore changes whenever a value changes.
        return hash(str(dict(self)))

    def __repr__(self):
        body = ", ".join(f"{key}={val}" for (key, val) in self.items())
        return f"{self.__class__.__name__}[{self.doc_id}]({body})"
2025-09-27 15:13:17 -07:00
2025-09-28 14:08:50 -07:00
@dataclass
class Pointer(Field):
    """
    Store a string reference to a record.

    References have the form ``"<table>::<uid>"``.
    """

    name: str = ""
    value_type: type = Record

    def serialize(self, value: value_type) -> str:
        """
        Return the string reference for ``value`` (see ``reference``).
        """
        return Pointer.reference(value)

    def deserialize(self, value: str, db: TinyDB, recurse: bool = True) -> value_type:
        """
        Resolve a string reference to its record (see ``dereference``).
        """
        return Pointer.dereference(value, db, recurse)

    @classmethod
    def reference(cls, value: Record):
        """
        Return ``"<table>::<uid>"`` for a record, or ``None`` for a falsy value.

        A value that is already a string is returned unchanged, mirroring
        ``dereference``, which returns non-string values unchanged. This keeps
        serialisation from failing on values that were never dereferenced.

        Raises PointerReferenceError if the record has a falsy ``doc_id``.
        """
        if not value:
            return None
        if isinstance(value, str):
            return value
        if not value.doc_id:
            raise PointerReferenceError(value)
        return f"{value._metadata.table}::{value.uid}"

    @classmethod
    def dereference(cls, value: str, db: TinyDB, recurse: bool = True):
        """
        Look up the record named by a ``"<table>::<uid>"`` string.

        Returns ``None`` for a falsy value. Non-string values, and strings
        with no uid part after ``"::"``, are returned unchanged. Otherwise the
        first result of searching the named table for that uid is returned.

        NOTE(review): ``[0]`` assumes the search finds a match; an empty
        result would presumably raise IndexError -- confirm against the table
        implementation.
        """
        if not value:
            return None
        if isinstance(value, str):
            # partition() never fails to unpack: a string without "::" yields
            # an empty uid and falls through to the pass-through return below.
            table_name, _, uid = value.partition("::")
            if uid:
                return db.table(table_name).search(where("uid") == uid, recurse=recurse)[0]
        return value
2025-09-29 23:10:33 -07:00
@dataclass
class BackReference(Pointer):
    """
    A Pointer that adds no fields or behaviour of its own.

    The distinct type lets other code pick out back-reference fields by class.
    """
@dataclass
class Collection(Field):
    """
    A collection of pointers.
    """

    value_type: type = Record
    default: List[value_type] = field(default_factory=list)

    def _pointer(self, rec):
        """
        Build a Pointer whose value_type is the concrete type of ``rec``.
        """
        return Pointer(value_type=type(rec))

    def serialize(self, values: List[value_type]) -> List[str]:
        """
        Serialize each member of the collection through a Pointer.
        """
        return [self._pointer(member).serialize(member) for member in values]

    def deserialize(self, values: List[str], db: TinyDB, recurse: bool = True) -> List[value_type]:
        """
        Recursively deserialize the objects in this collection.

        When ``recurse`` is false the stored values are returned untouched.
        """
        if not recurse:
            return values
        return [self._pointer(item).deserialize(item, db=db, recurse=recurse) for item in values]

    def after_insert(self, db: TinyDB, record: Record) -> None:
        """
        Populate any backreferences in the members of this collection with the parent record's uid.
        """
        members = record[self.name]
        if not members:
            return
        for member in members:
            target = Pointer.dereference(member, db=db)
            for backref in target._metadata.backrefs(type(record)):
                target[backref.name] = Pointer.reference(record)
                # NOTE(review): the in-memory target receives the reference
                # string while the table update receives the record itself --
                # confirm the table's update() serializes it.
                table = db.table(target._metadata.table)
                table.update({backref.name: record}, where("uid") == target.uid)