{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2025:CTB2TRVXFYOWF4XY3YTUOAVX4C","short_pith_number":"pith:CTB2TRVX","schema_version":"1.0","canonical_sha256":"14c3a9c6b72e1d62f2f8de274702b7e0bdfc07b91c6bd0fa9365a0c4f5308601","source":{"kind":"arxiv","id":"2510.13068","version":4},"attestation_state":"computed","paper":{"title":"NeuroRVQ: Multi-Scale Biosignal Tokenization for Generative Foundation Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.HC"],"primary_cat":"cs.LG","authors_text":"Alexandros Koliousis, Dario Farina, Dimitrios A. Adamos, Dimitrios Chalatsis, Konstantinos Barmpas, Na Lee, Nikolaos Laskaris, Stefanos Zafeiriou, William Raftery, Yannis Panagakis","submitted_at":"2025-10-15T01:26:52Z","abstract_excerpt":"Biosignals such as electroencephalography (EEG), electrocardiography (ECG), and electromyography (EMG) encode physiological activity across multiple temporal and spectral scales, yielding representations that are rich but challenging for machine learning. Foundation models trained to predict masked signal tokens have shown promise in learning generalizable biosignal representations, yet their performance depends on the tokenizer's ability to preserve high-frequency dynamics and reconstruct signals with high fidelity. We introduce NeuroRVQ, a modality-adaptive biosignal tokenizer family designe"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2510.13068","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-10-15T01:26:52Z","cross_cats_sorted":["cs.AI","cs.HC"],"title_canon_sha256":"3162583c536829ebf67f2ffd70f742494792f2279d23853631834dc1b5837640","abstract_canon_sha256":"caecca1559ef7d8cf864d015b4f8029b6d0abe88a73038d6c039520667bb8481"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:04:14.743574Z","signature_b64":"6YoxP8KsqMaTiOFmiXPk/AeBFrUwfCjiFOmj5jRnG4NC7QG2ELGkl16YDhWAiBWpuJRXAorpAfxdYRdyErwjBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"14c3a9c6b72e1d62f2f8de274702b7e0bdfc07b91c6bd0fa9365a0c4f5308601","last_reissued_at":"2026-05-20T00:04:14.742773Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:04:14.742773Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"NeuroRVQ: Multi-Scale Biosignal Tokenization for Generative Foundation Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.HC"],"primary_cat":"cs.LG","authors_text":"Alexandros Koliousis, Dario Farina, Dimitrios A. Adamos, Dimitrios Chalatsis, Konstantinos Barmpas, Na Lee, Nikolaos Laskaris, Stefanos Zafeiriou, William Raftery, Yannis Panagakis","submitted_at":"2025-10-15T01:26:52Z","abstract_excerpt":"Biosignals such as electroencephalography (EEG), electrocardiography (ECG), and electromyography (EMG) encode physiological activity across multiple temporal and spectral scales, yielding representations that are rich but challenging for machine learning. Foundation models trained to predict masked signal tokens have shown promise in learning generalizable biosignal representations, yet their performance depends on the tokenizer's ability to preserve high-frequency dynamics and reconstruct signals with high fidelity. We introduce NeuroRVQ, a modality-adaptive biosignal tokenizer family designe"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2510.13068","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2510.13068/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2510.13068","created_at":"2026-05-20T00:04:14.742909+00:00"},{"alias_kind":"arxiv_version","alias_value":"2510.13068v4","created_at":"2026-05-20T00:04:14.742909+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2510.13068","created_at":"2026-05-20T00:04:14.742909+00:00"},{"alias_kind":"pith_short_12","alias_value":"CTB2TRVXFYOW","created_at":"2026-05-20T00:04:14.742909+00:00"},{"alias_kind":"pith_short_16","alias_value":"CTB2TRVXFYOWF4XY","created_at":"2026-05-20T00:04:14.742909+00:00"},{"alias_kind":"pith_short_8","alias_value":"CTB2TRVX","created_at":"2026-05-20T00:04:14.742909+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":1,"internal_anchor_count":1,"sample":[{"citing_arxiv_id":"2604.28178","citing_title":"LLM as Clinical Graph Structure Refiner: Enhancing Representation Learning in EEG Seizure Diagnosis","ref_index":3,"is_internal_anchor":true}]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/CTB2TRVXFYOWF4XY3YTUOAVX4C","json":"https://pith.science/pith/CTB2TRVXFYOWF4XY3YTUOAVX4C.json","graph_json":"https://pith.science/api/pith-number/CTB2TRVXFYOWF4XY3YTUOAVX4C/graph.json","events_json":"https://pith.science/api/pith-number/CTB2TRVXFYOWF4XY3YTUOAVX4C/events.json","paper":"https://pith.science/paper/CTB2TRVX"},"agent_actions":{"view_html":"https://pith.science/pith/CTB2TRVXFYOWF4XY3YTUOAVX4C","download_json":"https://pith.science/pith/CTB2TRVXFYOWF4XY3YTUOAVX4C.json","view_paper":"https://pith.science/paper/CTB2TRVX","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2510.13068&json=true","fetch_graph":"https://pith.science/api/pith-number/CTB2TRVXFYOWF4XY3YTUOAVX4C/graph.json","fetch_events":"https://pith.science/api/pith-number/CTB2TRVXFYOWF4XY3YTUOAVX4C/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/CTB2TRVXFYOWF4XY3YTUOAVX4C/action/timestamp_anchor","attest_storage":"https://pith.science/pith/CTB2TRVXFYOWF4XY3YTUOAVX4C/action/storage_attestation","attest_author":"https://pith.science/pith/CTB2TRVXFYOWF4XY3YTUOAVX4C/action/author_attestation","sign_citation":"https://pith.science/pith/CTB2TRVXFYOWF4XY3YTUOAVX4C/action/citation_signature","submit_replication":"https://pith.science/pith/CTB2TRVXFYOWF4XY3YTUOAVX4C/action/replication_record"}},"created_at":"2026-05-20T00:04:14.742909+00:00","updated_at":"2026-05-20T00:04:14.742909+00:00"}