commit 1fc0a7f2e8561c2ae8204bfd287a52ef684135b7 · dwn.poxiao-labs.work/atpasser

src/atpasser/model/converter.py

···

       15
        
           UnknownModel, RecordModel, QueryModel,

     

       16
        
           ProcedureModel, SubscriptionModel

     

       17
        
       )

     

       0
        
       
     

       0
        
       
     

       18
        
       

     

       19
        
       class LexiconConverter:

     

       20
        
           """

     
···

       30
        
               "boolean": BooleanModel,

     

       31
        
               "integer": IntegerModel,

     

       32
        
               "string": StringModel,

     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       33
        
               

     

       34
        
               # Complex types

     

       35
        
               "array": ArrayModel,

···

       15
        
           UnknownModel, RecordModel, QueryModel,

     

       16
        
           ProcedureModel, SubscriptionModel

     

       17
        
       )

     

       18
       +
       from .types.binary import BytesModel, CidLinkModel

     

       19
       +
       from .blob import BlobModel

     

       20
        
       

     

       21
        
       class LexiconConverter:

     

       22
        
           """

     
···

       32
        
               "boolean": BooleanModel,

     

       33
        
               "integer": IntegerModel,

     

       34
        
               "string": StringModel,

     

       35
       +
               

     

       36
       +
               # Binary types

     

       37
       +
               "bytes": BytesModel,

     

       38
       +
               "cid-link": CidLinkModel,

     

       39
       +
               "blob": BlobModel,

     

       40
        
               

     

       41
        
               # Complex types

     

       42
        
               "array": ArrayModel,

+132

src/atpasser/model/types/binary.py

···

       1
       +
       """

     

       2
       +
       Binary data types for AT Protocol Lexicon models.

     

       3
       +
       

     

       4
       +
       Includes models for bytes, CID links and other binary data formats.

     

       5
       +
       """

     

       6
       +
       from typing import Any

     

       7
       +
       import base64

     

       8
       +
       from pydantic import field_validator, field_serializer

     

       9
       +
       from cid import CIDv1, make_cid

     

       10
       +
       from ..base import DataModel

     

       11
       +
       from ..exceptions import ValidationError, SerializationError, InvalidCIDError

     

       12
       +
       

     

       13
       +
       class BytesModel(DataModel):
           """
           Model for AT Protocol bytes type.

           Represents raw binary data that is encoded as base64 in JSON format.

           The optional length constraints are declared *before* ``value`` on
           purpose: the ``value`` validator reads them from ``info.data``, and
           pydantic only places fields validated earlier (in declaration order)
           into that mapping. Declaring ``value`` first would leave both limits
           invisible to the validator, so they would never be enforced.
           """

           min_length: int | None = None
           """Minimum size in bytes"""

           max_length: int | None = None
           """Maximum size in bytes"""

           value: bytes
           """Raw binary data"""

           def __init__(self, **data: Any) -> None:
               """
               Initialize bytes model with validation.

               Args:
                   **data: Input data containing bytes value and constraints

               Raises:
                   ValidationError: If length constraints are violated
               """
               super().__init__(**data)

           @field_validator("value")
           @classmethod
           def validate_length(cls, v: bytes, info: Any) -> bytes:
               """
               Validate bytes length against constraints.

               Args:
                   v: Bytes value to validate
                   info: Validation info; ``info.data`` holds the already
                       validated ``min_length`` / ``max_length`` fields

               Returns:
                   Validated bytes

               Raises:
                   ValidationError: If length constraints are violated
               """
               min_len = info.data.get("min_length")
               max_len = info.data.get("max_length")
               size = len(v)

               if min_len is not None and size < min_len:
                   raise ValidationError(
                       field="value",
                       message=f"Bytes length {size} is less than minimum {min_len}"
                   )

               if max_len is not None and size > max_len:
                   raise ValidationError(
                       field="value",
                       message=f"Bytes length {size} exceeds maximum {max_len}"
                   )

               return v

           @field_serializer("value")
           def serialize_bytes(self, v: bytes) -> dict[str, str]:
               """
               Serialize bytes to JSON format with base64 encoding.

               Args:
                   v: Bytes to serialize

               Returns:
                   Dictionary with base64 encoded bytes under the ``$bytes`` key

               Raises:
                   SerializationError: If encoding fails
               """
               try:
                   return {"$bytes": base64.b64encode(v).decode()}
               except Exception as e:
                   # Chain the cause so the original failure stays in the traceback.
                   raise SerializationError("value", f"Failed to encode bytes: {e}") from e

     

       91
       +
       

     

       92
       +
       class CidLinkModel(DataModel):
           """
           Model for AT Protocol CID link type.

           Represents content-addressable links using CIDs (Content Identifiers).
           """

           link: CIDv1
           """CID reference to linked content"""

           def __init__(self, **data: Any) -> None:
               """
               Initialize CID link model with validation.

               The link may be supplied as a CID object, as a CID string, or in
               the JSON wire form emitted by ``serialize_cid`` -- either nested
               (``link={"$link": "..."}``) or as a top-level ``$link`` key.

               Args:
                   **data: Input data containing CID link

               Raises:
                   InvalidCIDError: If CID is invalid
               """
               # Accept the JSON object itself being splatted into the constructor.
               if "link" not in data and "$link" in data:
                   data["link"] = data.pop("$link")

               link = data.get("link")

               # Unwrap the serialized form so a dumped model can be loaded back.
               if isinstance(link, dict) and isinstance(link.get("$link"), str):
                   link = link["$link"]

               if isinstance(link, str):
                   try:
                       # NOTE(review): make_cid presumably can also yield a CIDv0 for
                       # legacy strings, which the CIDv1 annotation would then
                       # reject -- confirm against the cid library.
                       data["link"] = make_cid(link)
                   except ValueError as e:
                       raise InvalidCIDError(f"Invalid CID: {e}") from e

               super().__init__(**data)

           @field_serializer("link")
           def serialize_cid(self, v: CIDv1) -> dict[str, str]:
               """
               Serialize CID to JSON format.

               Args:
                   v: CID to serialize

               Returns:
                   Dictionary with string CID representation under ``$link``
               """
               return {"$link": str(v)}

+26 -1

src/atpasser/model/types/complex.py

···

       138
        
           """Map of parameter names to their schema definitions"""

     

       139
        
           

     

       140
        
           value: dict[str, Any]

     

       141
       -
           """Parameter values"""

     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       142
        
           

     

       143
        
           def __init__(self, **data: Any) -> None:

     

       144
        
               """

     
···

       185
        
                           raise ValueError(f"Parameter {param} must be integer")

     

       186
        
                       elif prop_type == "string" and not isinstance(value, str):

     

       187
        
                           raise ValueError(f"Parameter {param} must be string")

     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       188
        
                           

     

       189
        
               return v

···

       138
        
           """Map of parameter names to their schema definitions"""

     

       139
        
           

     

       140
        
           value: dict[str, Any]

     

       141
       +
           """Parameter values

     

       142
       +
           

     

       143
       +
           Supported types:

     

       144
       +
           - boolean

     

       145
       +
           - integer

     

       146
       +
           - string

     

       147
       +
           - array (of boolean/integer/string/unknown)

     

       148
       +
           - unknown (object)

     

       149
       +
           """

     

       150
        
           

     

       151
        
           def __init__(self, **data: Any) -> None:

     

       152
        
               """

     
···

       193
        
                           raise ValueError(f"Parameter {param} must be integer")

     

       194
        
                       elif prop_type == "string" and not isinstance(value, str):

     

       195
        
                           raise ValueError(f"Parameter {param} must be string")

     

       196
       +
                       elif prop_type == "array":

     

       197
       +
                           if not isinstance(value, list):

     

       198
       +
                               raise ValueError(f"Parameter {param} must be array")

     

       199
       +
                           # Validate array items if schema is specified

     

       200
       +
                           if "items" in cls.properties[param]:

     

       201
       +
                               item_type = cls.properties[param]["items"].get("type")

     

       202
       +
                               for item in value:

     

       203
       +
                                   if item_type == "boolean" and not isinstance(item, bool):

     

       204
       +
                                       raise ValueError(f"Array item in {param} must be boolean")

     

       205
       +
                                   elif item_type == "integer" and not isinstance(item, int):

     

       206
       +
                                       raise ValueError(f"Array item in {param} must be integer")

     

       207
       +
                                   elif item_type == "string" and not isinstance(item, str):

     

       208
       +
                                       raise ValueError(f"Array item in {param} must be string")

     

       209
       +
                                   elif item_type == "unknown" and not isinstance(item, dict):

     

       210
       +
                                       raise ValueError(f"Array item in {param} must be object")

     

       211
       +
                       elif prop_type == "unknown" and not isinstance(value, dict):

     

       212
       +
                           raise ValueError(f"Parameter {param} must be object")

     

       213
        
                           

     

       214
        
               return v

+72 -1

src/atpasser/model/types/string.py

···

       88
        
                       cls._validate_did(v)

     

       89
        
                   elif cls.format == "handle":

     

       90
        
                       cls._validate_handle(v)

     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       91
        
                   

     

       92
        
               return v

     

       93
        
           

     
···

       121
        
               if not re.match(r"^[a-zA-Z0-9._-]+$", v):

     

       122
        
                   raise ValueError("Handle contains invalid characters")

     

       123
        
               if len(v) > 253:

     

       124
       -
                   raise ValueError("Handle too long, max 253 chars")
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0
        
       
     

       0

···

       88
        
                       cls._validate_did(v)

     

       89
        
                   elif cls.format == "handle":

     

       90
        
                       cls._validate_handle(v)

     

       91
       +
                   elif cls.format == "at-identifier":

     

       92
       +
                       cls._validate_at_identifier(v)

     

       93
       +
                   elif cls.format == "at-uri":

     

       94
       +
                       cls._validate_at_uri(v)

     

       95
       +
                   elif cls.format == "cid":

     

       96
       +
                       cls._validate_cid(v)

     

       97
       +
                   elif cls.format == "nsid":

     

       98
       +
                       cls._validate_nsid(v)

     

       99
       +
                   elif cls.format == "tid":

     

       100
       +
                       cls._validate_tid(v)

     

       101
       +
                   elif cls.format == "record-key":

     

       102
       +
                       cls._validate_record_key(v)

     

       103
       +
                   elif cls.format == "language":

     

       104
       +
                       cls._validate_language(v)

     

       105
        
                   

     

       106
        
               return v

     

       107
        
           

     
···

       135
        
               if not re.match(r"^[a-zA-Z0-9._-]+$", v):

     

       136
        
                   raise ValueError("Handle contains invalid characters")

     

       137
        
               if len(v) > 253:

     

       138
       +
                   raise ValueError("Handle too long, max 253 chars")

     

       139
       +
       

     

       140
       +
           @classmethod
           def _validate_at_identifier(cls, v: str) -> None:
               """Check that *v* is an at-identifier, i.e. a DID or a handle.

               Values starting with ``did:`` go to the DID validator; everything
               else goes to the handle validator. Any ``ValueError`` from either
               is re-raised with an ``Invalid at-identifier:`` prefix.
               """
               checker = cls._validate_did if v.startswith("did:") else cls._validate_handle
               try:
                   checker(v)
               except ValueError as err:
                   raise ValueError(f"Invalid at-identifier: {err}")

     

       150
       +
       

     

       151
       +
           @classmethod
           def _validate_at_uri(cls, v: str) -> None:
               """Check the basic shape of an AT-URI.

               Only two things are verified: the ``at://`` scheme prefix and an
               overall length of at most 8000 characters. The first failing rule
               raises ``ValueError``.
               """
               rules = (
                   (not v.startswith("at://"), "AT-URI must start with 'at://'"),
                   (len(v) > 8000, "AT-URI too long, max 8000 chars"),
               )
               for violated, message in rules:
                   if violated:
                       raise ValueError(message)

     

       158
       +
       

     

       159
       +
           @classmethod
           def _validate_cid(cls, v: str) -> None:
               """Validate CID string format.

               Accepts 1-100 ASCII alphanumeric characters. This is a syntactic
               check only; the CID is not decoded.

               Raises:
                   ValueError: If the string is too long, empty, or contains a
                       non-alphanumeric character.
               """
               if len(v) > 100:
                   raise ValueError("CID too long, max 100 chars")
               # fullmatch, not match + "$": "$" also matches just before a trailing
               # newline, which would let "bafy...\n" through.
               if not re.fullmatch(r"[a-zA-Z0-9]+", v):
                   raise ValueError("CID contains invalid characters")

     

       166
       +
       

     

       167
       +
           @classmethod
           def _validate_nsid(cls, v: str) -> None:
               """Validate NSID format.

               Checks the overall length (max 317), the allowed character set
               (ASCII letters, digits, ``.`` and ``-``), and the segment layout:
               at least three period-separated segments, each 1-63 characters.

               Raises:
                   ValueError: If any of the checks above fails.
               """
               if len(v) > 317:
                   raise ValueError("NSID too long, max 317 chars")
               # fullmatch so a trailing newline is not silently accepted.
               if not re.fullmatch(r"[a-zA-Z0-9.-]+", v):
                   raise ValueError("NSID contains invalid characters")

               segments = v.split(".")
               # An NSID is a reversed domain authority (>= 2 segments) plus a name.
               if len(segments) < 3:
                   raise ValueError("NSID must have at least 3 segments")
               if any(not 1 <= len(segment) <= 63 for segment in segments):
                   raise ValueError("NSID segments must be 1-63 chars")

     

       174
       +
       

     

       175
       +
           @classmethod
           def _validate_tid(cls, v: str) -> None:
               """Validate TID format.

               A TID is exactly 13 characters from the base32-sortable alphabet
               (``234567abcdefghijklmnopqrstuvwxyz``), and its first character is
               limited to ``234567abcdefghij``.

               Raises:
                   ValueError: If the length, alphabet or first character is wrong.
               """
               if len(v) > 13:
                   raise ValueError("TID too long, max 13 chars")
               if len(v) < 13:
                   raise ValueError("TID too short, must be 13 chars")
               # fullmatch so a trailing newline is not silently accepted.
               if not re.fullmatch(r"[234567abcdefghijklmnopqrstuvwxyz]+", v):
                   raise ValueError("TID contains invalid characters")
               # The leading character is restricted to the first half of the
               # alphabet (the top bit of the encoded integer is always zero).
               if v[0] not in "234567abcdefghij":
                   raise ValueError("TID has invalid first character")

     

       182
       +
       

     

       183
       +
           @classmethod
           def _validate_record_key(cls, v: str) -> None:
               """Validate record-key format.

               A record key is 1-512 characters drawn from ASCII letters, digits
               and ``. - _ : ~``. The two path-like values ``.`` and ``..`` are
               rejected.

               Raises:
                   ValueError: If the key is too long, empty, reserved, or contains
                       a character outside the allowed set.
               """
               if len(v) > 512:
                   raise ValueError("Record key too long, max 512 chars")
               # "-" is placed last in the class so it is a literal dash. Written as
               # "%-~" it forms a range covering almost all printable ASCII
               # ("/", "#", "@", "+", ...), which defeats the check.
               if not re.fullmatch(r"[a-zA-Z0-9._:~-]+", v):
                   raise ValueError("Record key contains invalid characters")
               if v in (".", ".."):
                   raise ValueError("Record key must not be '.' or '..'")

     

       190
       +
       

     

       191
       +
           @classmethod
           def _validate_language(cls, v: str) -> None:
               """Validate BCP 47 language tag.

               This is a shape check only: a primary subtag of 1-8 letters,
               followed by any number of ``-``-separated alphanumeric subtags of
               1-8 characters. Subtags are not looked up in any registry.

               Raises:
                   ValueError: If the tag does not have that shape.
               """
               # fullmatch, not match + "$": "$" also matches just before a trailing
               # newline, which would let "en\n" through.
               if not re.fullmatch(r"[a-zA-Z]{1,8}(-[a-zA-Z0-9]{1,8})*", v):
                   raise ValueError("Invalid language tag format")