{
"id": "science.alt.dataset.arrayFormat",
"defs": {
"main": {
"type": "string",
"maxLength": 50,
"description": "Array serialization format identifier for NDArray fields in sample schemas. Known values correspond to token definitions in this Lexicon. Each format has versioned specifications maintained by alt.science at canonical URLs.",
"knownValues": [
"ndarrayBytes",
"sparseBytes",
"structuredBytes",
"arrowTensor",
"safetensors"
]
},
"arrowTensor": {
"type": "token",
"description": "Arrow tensor format. Stores multi-dimensional arrays using Arrow's tensor IPC format. Versions maintained at https://json-schema.alt.science/atdata-arrow-tensor/{version}/"
},
"safetensors": {
"type": "token",
"description": "Safetensors format (Hugging Face). Stores ML tensors with safe, memory-mapped access. Versions maintained at https://json-schema.alt.science/atdata-safetensors/{version}/"
},
"sparseBytes": {
"type": "token",
"description": "SciPy sparse matrix format (CSR/CSC/COO). Stores sparse matrices with indices and data arrays. Versions maintained at https://json-schema.alt.science/atdata-sparse-bytes/{version}/"
},
"ndarrayBytes": {
"type": "token",
"description": "NumPy .npy binary format for NDArray serialization. Stores arrays with dtype and shape in binary header. Versions maintained at https://json-schema.alt.science/atdata-ndarray-bytes/{version}/"
},
"structuredBytes": {
"type": "token",
"description": "NumPy structured array format. Stores arrays with named, typed fields (compound dtypes). Versions maintained at https://json-schema.alt.science/atdata-structured-bytes/{version}/"
}
},
"$type": "com.atproto.lexicon.schema",
"lexicon": 1
}
Metadata
- DID: did:web:lexicon.store
- CID: bafyreidnp5rawyh6edzahw6reii4xmvxe7q5zaxurin2vje3y6lcegkemi
- Indexed At: 2026-03-20 15:55 UTC
- AT-URI: at://did:web:lexicon.store/com.atproto.lexicon.schema/science.alt.dataset.arrayFormat