{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:2H2TU4BL4YYCYG3Y6ADTMM73OQ","short_pith_number":"pith:2H2TU4BL","canonical_record":{"source":{"id":"1506.02004","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-06-05T18:20:43Z","cross_cats_sorted":[],"title_canon_sha256":"64e1884812372238f5ac14fc76fa5550f3c52d0f1ba4832a96b6965b17ad868a","abstract_canon_sha256":"4475af00928a2868cba428b629ef815b3aab47b1837be11bbdb890b6eff2a1b6"},"schema_version":"1.0"},"canonical_sha256":"d1f53a702be6302c1b78f0073633fb743fea7a7af6bdd3845e5ccde0764d7904","source":{"kind":"arxiv","id":"1506.02004","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1506.02004","created_at":"2026-05-18T01:55:58Z"},{"alias_kind":"arxiv_version","alias_value":"1506.02004v1","created_at":"2026-05-18T01:55:58Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1506.02004","created_at":"2026-05-18T01:55:58Z"},{"alias_kind":"pith_short_12","alias_value":"2H2TU4BL4YYC","created_at":"2026-05-18T12:28:59Z"},{"alias_kind":"pith_short_16","alias_value":"2H2TU4BL4YYCYG3Y","created_at":"2026-05-18T12:28:59Z"},{"alias_kind":"pith_short_8","alias_value":"2H2TU4BL","created_at":"2026-05-18T12:28:59Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:2H2TU4BL4YYCYG3Y6ADTMM73OQ","target":"record","payload":{"canonical_record":{"source":{"id":"1506.02004","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-06-05T18:20:43Z","cross_cats_sorted":[],"title_canon_sha256":"64e1884812372238f5ac14fc76fa5550f3c52d0f1ba4832a96b6965b17ad868a","abstract_canon_sha256":"4475af00928a2868cba428b629ef815b3aab47b1837be11bbdb890b6eff2a1b6"},"schema_version":"1.0"},"canonical_sha256":"d1f53a702be6302c1b78f0073633fb743fea7a7af6bdd3845e5ccde0764d7904","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:55:58.705660Z","signature_b64":"w3rjESMlgS0YN1gnWxLhbbrxM1pNw2IYrS38IEUIpTTIeTmEgl9yZDvptE9+HNE7yTX/gr2GoGf146T1YuKhAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d1f53a702be6302c1b78f0073633fb743fea7a7af6bdd3845e5ccde0764d7904","last_reissued_at":"2026-05-18T01:55:58.705137Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:55:58.705137Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1506.02004","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:55:58Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"X6cv4bb393f3JKkxnNL1f+1nJE7RF9lSPyZPNvjG+TBox3nTg/7M0b0u6uXQY3RgNxoDSWbloxtQga2DeOfRBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T19:30:27.957251Z"},"content_sha256":"1bc030d0f210ec6b0ad1b1c079956f0a6376459d1f932048fa25a061068db665","schema_version":"1.0","event_id":"sha256:1bc030d0f210ec6b0ad1b1c079956f0a6376459d1f932048fa25a061068db665"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:2H2TU4BL4YYCYG3Y6ADTMM73OQ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Sparse Overcomplete Word Vector Representations","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Chris Dyer, Dani Yogatama, Manaal Faruqui, Noah Smith, Yulia Tsvetkov","submitted_at":"2015-06-05T18:20:43Z","abstract_excerpt":"Current distributed representations of words show little resemblance to theories of lexical semantics. The former are dense and uninterpretable, the latter largely based on familiar, discrete classes (e.g., supersenses) and relations (e.g., synonymy and hypernymy). We propose methods that transform word vectors into sparse (and optionally binary) vectors. The resulting representations are more similar to the interpretable features typically used in NLP, though they are discovered automatically from raw corpora. Because the vectors are highly sparse, they are computationally easy to work with. "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1506.02004","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:55:58Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"BpiN0ZOv4reF7M54dTDjoawbHJXYNwYoQtVW8cYpREVULzo9JjSxWrqXcGef6M1Kq4Uam7PSkG4kN8+V6xyTDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T19:30:27.957904Z"},"content_sha256":"3ed6f0f045faae5020da859b8bdc7d276d3d76ee9e8cef8f7132d58a1bd584c5","schema_version":"1.0","event_id":"sha256:3ed6f0f045faae5020da859b8bdc7d276d3d76ee9e8cef8f7132d58a1bd584c5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/2H2TU4BL4YYCYG3Y6ADTMM73OQ/bundle.json","state_url":"https://pith.science/pith/2H2TU4BL4YYCYG3Y6ADTMM73OQ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/2H2TU4BL4YYCYG3Y6ADTMM73OQ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-24T19:30:27Z","links":{"resolver":"https://pith.science/pith/2H2TU4BL4YYCYG3Y6ADTMM73OQ","bundle":"https://pith.science/pith/2H2TU4BL4YYCYG3Y6ADTMM73OQ/bundle.json","state":"https://pith.science/pith/2H2TU4BL4YYCYG3Y6ADTMM73OQ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/2H2TU4BL4YYCYG3Y6ADTMM73OQ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:2H2TU4BL4YYCYG3Y6ADTMM73OQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4475af00928a2868cba428b629ef815b3aab47b1837be11bbdb890b6eff2a1b6","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-06-05T18:20:43Z","title_canon_sha256":"64e1884812372238f5ac14fc76fa5550f3c52d0f1ba4832a96b6965b17ad868a"},"schema_version":"1.0","source":{"id":"1506.02004","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1506.02004","created_at":"2026-05-18T01:55:58Z"},{"alias_kind":"arxiv_version","alias_value":"1506.02004v1","created_at":"2026-05-18T01:55:58Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1506.02004","created_at":"2026-05-18T01:55:58Z"},{"alias_kind":"pith_short_12","alias_value":"2H2TU4BL4YYC","created_at":"2026-05-18T12:28:59Z"},{"alias_kind":"pith_short_16","alias_value":"2H2TU4BL4YYCYG3Y","created_at":"2026-05-18T12:28:59Z"},{"alias_kind":"pith_short_8","alias_value":"2H2TU4BL","created_at":"2026-05-18T12:28:59Z"}],"graph_snapshots":[{"event_id":"sha256:3ed6f0f045faae5020da859b8bdc7d276d3d76ee9e8cef8f7132d58a1bd584c5","target":"graph","created_at":"2026-05-18T01:55:58Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Current distributed representations of words show little resemblance to theories of lexical semantics. The former are dense and uninterpretable, the latter largely based on familiar, discrete classes (e.g., supersenses) and relations (e.g., synonymy and hypernymy). We propose methods that transform word vectors into sparse (and optionally binary) vectors. The resulting representations are more similar to the interpretable features typically used in NLP, though they are discovered automatically from raw corpora. Because the vectors are highly sparse, they are computationally easy to work with. ","authors_text":"Chris Dyer, Dani Yogatama, Manaal Faruqui, Noah Smith, Yulia Tsvetkov","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-06-05T18:20:43Z","title":"Sparse Overcomplete Word Vector Representations"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1506.02004","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:1bc030d0f210ec6b0ad1b1c079956f0a6376459d1f932048fa25a061068db665","target":"record","created_at":"2026-05-18T01:55:58Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4475af00928a2868cba428b629ef815b3aab47b1837be11bbdb890b6eff2a1b6","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-06-05T18:20:43Z","title_canon_sha256":"64e1884812372238f5ac14fc76fa5550f3c52d0f1ba4832a96b6965b17ad868a"},"schema_version":"1.0","source":{"id":"1506.02004","kind":"arxiv","version":1}},"canonical_sha256":"d1f53a702be6302c1b78f0073633fb743fea7a7af6bdd3845e5ccde0764d7904","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d1f53a702be6302c1b78f0073633fb743fea7a7af6bdd3845e5ccde0764d7904","first_computed_at":"2026-05-18T01:55:58.705137Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:55:58.705137Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"w3rjESMlgS0YN1gnWxLhbbrxM1pNw2IYrS38IEUIpTTIeTmEgl9yZDvptE9+HNE7yTX/gr2GoGf146T1YuKhAA==","signature_status":"signed_v1","signed_at":"2026-05-18T01:55:58.705660Z","signed_message":"canonical_sha256_bytes"},"source_id":"1506.02004","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:1bc030d0f210ec6b0ad1b1c079956f0a6376459d1f932048fa25a061068db665","sha256:3ed6f0f045faae5020da859b8bdc7d276d3d76ee9e8cef8f7132d58a1bd584c5"],"state_sha256":"3061f0d6e0dd0b3fbc84b9708872b9852bf5ad44ca754d57dd5ef3988ed0a14a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Zo7D0CSWP1QgGsMVc0Cv62zTywL1JmOWQYtK0B1kUeC4YLbB+1GvAqZbyM4P4euUqnnXlQ7g3un3MCpXZ2/oAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-24T19:30:27.961906Z","bundle_sha256":"c476e83b4d710f6d0e236171bd386fe17401d4007fbd6d5d95d0c8f5a7b7c3ca"}}