{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:AKCNMAWVWS3M46QWRV2BKMWOJT","short_pith_number":"pith:AKCNMAWV","canonical_record":{"source":{"id":"1803.08869","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:30:06Z","cross_cats_sorted":["cs.LG","cs.SD","eess.AS"],"title_canon_sha256":"4c53ae9d4dc5c1e2c619cf8eaf4de5b4fe9c2b1f6887605713ad04520a9c3114","abstract_canon_sha256":"af75c5a1ca729532ebb4a9bba21a61c0996574d27067ab3f39fca84cba7530c4"},"schema_version":"1.0"},"canonical_sha256":"0284d602d5b4b6ce7a168d741532ce4ce8e108a2a214eb65ac07468acb735c90","source":{"kind":"arxiv","id":"1803.08869","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.08869","created_at":"2026-05-18T00:02:18Z"},{"alias_kind":"arxiv_version","alias_value":"1803.08869v2","created_at":"2026-05-18T00:02:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.08869","created_at":"2026-05-18T00:02:18Z"},{"alias_kind":"pith_short_12","alias_value":"AKCNMAWVWS3M","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_16","alias_value":"AKCNMAWVWS3M46QW","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_8","alias_value":"AKCNMAWV","created_at":"2026-05-18T12:32:13Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:AKCNMAWVWS3M46QWRV2BKMWOJT","target":"record","payload":{"canonical_record":{"source":{"id":"1803.08869","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:30:06Z","cross_cats_sorted":["cs.LG","cs.SD","eess.AS"],"title_canon_sha256":"4c53ae9d4dc5c1e2c619cf8eaf4de5b4fe9c2b1f6887605713ad04520a9c3114","abstract_canon_sha256":"af75c5a1ca729532ebb4a9bba21a61c0996574d27067ab3f39fca84cba7530c4"},"schema_version":"1.0"},"canonical_sha256":"0284d602d5b4b6ce7a168d741532ce4ce8e108a2a214eb65ac07468acb735c90","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:02:18.104969Z","signature_b64":"g6yF6Disl7YyYhjzK2KL/nufrSX0mX3ksXuWrIuHXLttnoVHNnFHhenCrHR4wfHXFcS8l2E1QX8gpQMc35/gCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0284d602d5b4b6ce7a168d741532ce4ce8e108a2a214eb65ac07468acb735c90","last_reissued_at":"2026-05-18T00:02:18.104452Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:02:18.104452Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1803.08869","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:02:18Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JBMcggk2Tu06UTaVg+PaClScFGvHxBhYp8Ioi6lUuhEcYby+jiBi28d44RReP9tbViqBAjFw0wwDrwEdkWjLDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T14:34:30.932454Z"},"content_sha256":"54e88a0e3143589566716dad051b0dded12241ebe9ddc2b11d1f44542544a7c4","schema_version":"1.0","event_id":"sha256:54e88a0e3143589566716dad051b0dded12241ebe9ddc2b11d1f44542544a7c4"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:AKCNMAWVWS3M46QWRV2BKMWOJT","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"On the difficulty of a distributional semantics of spoken language","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","cs.SD","eess.AS"],"primary_cat":"cs.CL","authors_text":"Afra Alishahi, \\'Akos K\\'ad\\'ar, Grzegorz Chrupa{\\l}a, Lieke Gelderloos","submitted_at":"2018-03-23T16:30:06Z","abstract_excerpt":"In the domain of unsupervised learning most work on speech has focused on discovering low-level constructs such as phoneme inventories or word-like units. In contrast, for written language, where there is a large body of work on unsupervised induction of semantic representations of words, whole sentences and longer texts. In this study we examine the challenges of adapting these approaches from written to spoken language. We conjecture that unsupervised learning of the semantics of spoken language becomes feasible if we abstract from the surface variability. We simulate this setting with a dat"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.08869","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:02:18Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Dx/2YSC3oPn9CHzYGTrsG9cUXWKV7XMN5CEnWFsNBbPUGw0KtLD4jwOLLWWFn4k+oRtvSF6tv/DEXOJ9qJ92BA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T14:34:30.932801Z"},"content_sha256":"b53a064abe33696765b443677895d08f5922dc527908420cf7f116d62f160390","schema_version":"1.0","event_id":"sha256:b53a064abe33696765b443677895d08f5922dc527908420cf7f116d62f160390"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/AKCNMAWVWS3M46QWRV2BKMWOJT/bundle.json","state_url":"https://pith.science/pith/AKCNMAWVWS3M46QWRV2BKMWOJT/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/AKCNMAWVWS3M46QWRV2BKMWOJT/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-28T14:34:30Z","links":{"resolver":"https://pith.science/pith/AKCNMAWVWS3M46QWRV2BKMWOJT","bundle":"https://pith.science/pith/AKCNMAWVWS3M46QWRV2BKMWOJT/bundle.json","state":"https://pith.science/pith/AKCNMAWVWS3M46QWRV2BKMWOJT/state.json","well_known_bundle":"https://pith.science/.well-known/pith/AKCNMAWVWS3M46QWRV2BKMWOJT/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:AKCNMAWVWS3M46QWRV2BKMWOJT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"af75c5a1ca729532ebb4a9bba21a61c0996574d27067ab3f39fca84cba7530c4","cross_cats_sorted":["cs.LG","cs.SD","eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:30:06Z","title_canon_sha256":"4c53ae9d4dc5c1e2c619cf8eaf4de5b4fe9c2b1f6887605713ad04520a9c3114"},"schema_version":"1.0","source":{"id":"1803.08869","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.08869","created_at":"2026-05-18T00:02:18Z"},{"alias_kind":"arxiv_version","alias_value":"1803.08869v2","created_at":"2026-05-18T00:02:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.08869","created_at":"2026-05-18T00:02:18Z"},{"alias_kind":"pith_short_12","alias_value":"AKCNMAWVWS3M","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_16","alias_value":"AKCNMAWVWS3M46QW","created_at":"2026-05-18T12:32:13Z"},{"alias_kind":"pith_short_8","alias_value":"AKCNMAWV","created_at":"2026-05-18T12:32:13Z"}],"graph_snapshots":[{"event_id":"sha256:b53a064abe33696765b443677895d08f5922dc527908420cf7f116d62f160390","target":"graph","created_at":"2026-05-18T00:02:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In the domain of unsupervised learning most work on speech has focused on discovering low-level constructs such as phoneme inventories or word-like units. In contrast, for written language, where there is a large body of work on unsupervised induction of semantic representations of words, whole sentences and longer texts. In this study we examine the challenges of adapting these approaches from written to spoken language. We conjecture that unsupervised learning of the semantics of spoken language becomes feasible if we abstract from the surface variability. We simulate this setting with a dat","authors_text":"Afra Alishahi, \\'Akos K\\'ad\\'ar, Grzegorz Chrupa{\\l}a, Lieke Gelderloos","cross_cats":["cs.LG","cs.SD","eess.AS"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:30:06Z","title":"On the difficulty of a distributional semantics of spoken language"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.08869","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:54e88a0e3143589566716dad051b0dded12241ebe9ddc2b11d1f44542544a7c4","target":"record","created_at":"2026-05-18T00:02:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"af75c5a1ca729532ebb4a9bba21a61c0996574d27067ab3f39fca84cba7530c4","cross_cats_sorted":["cs.LG","cs.SD","eess.AS"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-03-23T16:30:06Z","title_canon_sha256":"4c53ae9d4dc5c1e2c619cf8eaf4de5b4fe9c2b1f6887605713ad04520a9c3114"},"schema_version":"1.0","source":{"id":"1803.08869","kind":"arxiv","version":2}},"canonical_sha256":"0284d602d5b4b6ce7a168d741532ce4ce8e108a2a214eb65ac07468acb735c90","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"0284d602d5b4b6ce7a168d741532ce4ce8e108a2a214eb65ac07468acb735c90","first_computed_at":"2026-05-18T00:02:18.104452Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:02:18.104452Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"g6yF6Disl7YyYhjzK2KL/nufrSX0mX3ksXuWrIuHXLttnoVHNnFHhenCrHR4wfHXFcS8l2E1QX8gpQMc35/gCw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:02:18.104969Z","signed_message":"canonical_sha256_bytes"},"source_id":"1803.08869","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:54e88a0e3143589566716dad051b0dded12241ebe9ddc2b11d1f44542544a7c4","sha256:b53a064abe33696765b443677895d08f5922dc527908420cf7f116d62f160390"],"state_sha256":"11d741ae6a1d21ff3f5a47e58e69581b7f43345001351629946b868788e78c71"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"qva5eJ4Na3q72GMpq2npoDuXNjEGOqlE0a8udSMUgTfIhOnkqk++2bsKsvGQCNsWxz27I+Vp31JMmC67UYiMBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-28T14:34:30.934687Z","bundle_sha256":"da0ff6420f642e6ca8419f9b4528a13a3bedc8b4e2d01f3f7206deec331cb415"}}