{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:NSCUFH7435SHGFJGZUL6AWRLI7","short_pith_number":"pith:NSCUFH74","canonical_record":{"source":{"id":"1809.08621","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-09-23T16:02:03Z","cross_cats_sorted":[],"title_canon_sha256":"1c4b747d05789a6590b84e9f81760aa611e68e9401ee2c2a51974d5d6e4ac92c","abstract_canon_sha256":"958cc5a060cb3d978ac13bd181e5dd8478f9ac5dd7036b0897bb654dde617d8b"},"schema_version":"1.0"},"canonical_sha256":"6c85429ffcdf64731526cd17e05a2b47ffde81df9d3c891911fbc5f4f52a023f","source":{"kind":"arxiv","id":"1809.08621","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1809.08621","created_at":"2026-05-18T00:04:54Z"},{"alias_kind":"arxiv_version","alias_value":"1809.08621v2","created_at":"2026-05-18T00:04:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.08621","created_at":"2026-05-18T00:04:54Z"},{"alias_kind":"pith_short_12","alias_value":"NSCUFH7435SH","created_at":"2026-05-18T12:32:40Z"},{"alias_kind":"pith_short_16","alias_value":"NSCUFH7435SHGFJG","created_at":"2026-05-18T12:32:40Z"},{"alias_kind":"pith_short_8","alias_value":"NSCUFH74","created_at":"2026-05-18T12:32:40Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:NSCUFH7435SHGFJGZUL6AWRLI7","target":"record","payload":{"canonical_record":{"source":{"id":"1809.08621","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-09-23T16:02:03Z","cross_cats_sorted":[],"title_canon_sha256":"1c4b747d05789a6590b84e9f81760aa611e68e9401ee2c2a51974d5d6e4ac92c","abstract_canon_sha256":"958cc5a060cb3d978ac13bd181e5dd8478f9ac5dd7036b0897bb654dde617d8b"},"schema_version":"1.0"},"canonical_sha256":"6c85429ffcdf64731526cd17e05a2b47ffde81df9d3c891911fbc5f4f52a023f","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:04:54.254043Z","signature_b64":"Q03dtIWG+4oANDN6tDO3vAwe1QOJ0nO/OFlU7ZCmOAUMkOWzZDs1VruA6RCiKVpeNJzvV5Laa9b/7RP/qbRWBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6c85429ffcdf64731526cd17e05a2b47ffde81df9d3c891911fbc5f4f52a023f","last_reissued_at":"2026-05-18T00:04:54.253432Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:04:54.253432Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1809.08621","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:04:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IyjeO4dLBHK8m2Ttqan0Oz6JQ6RC+qietSWUepx0jIHOh/FTdEjs7e7Zh2qCLp1XAPgGkVANpG1r+dkxDg71DQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T12:20:27.315821Z"},"content_sha256":"d1fe5fa16205baf778bcc9abbf7ca57fed87473ea530c4cbe0099eb951a80687","schema_version":"1.0","event_id":"sha256:d1fe5fa16205baf778bcc9abbf7ca57fed87473ea530c4cbe0099eb951a80687"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:NSCUFH7435SHGFJGZUL6AWRLI7","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Learning and Evaluating Sparse Interpretable Sentence Embeddings","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Anna Potapenko, Octavian-Eugen Ganea, Thomas Hofmann, Valentin Trifonov","submitted_at":"2018-09-23T16:02:03Z","abstract_excerpt":"Previous research on word embeddings has shown that sparse representations, which can be either learned on top of existing dense embeddings or obtained through model constraints during training time, have the benefit of increased interpretability properties: to some degree, each dimension can be understood by a human and associated with a recognizable feature in the data. In this paper, we transfer this idea to sentence embeddings and explore several approaches to obtain a sparse representation. We further introduce a novel, quantitative and automated evaluation metric for sentence embedding i"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.08621","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:04:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"acITdl9lLdHj1mwaP+S8SxtNGMa+lfdman6sxD+YIlejrBjtKkQvWkOwzveYlGM/bdv6VcIhkbu8ZlTrvF03Ag==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T12:20:27.316528Z"},"content_sha256":"804bd3d2cebd906d076f4ed1c06c1405eab16818ecfa49facc8d91f929f273bf","schema_version":"1.0","event_id":"sha256:804bd3d2cebd906d076f4ed1c06c1405eab16818ecfa49facc8d91f929f273bf"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NSCUFH7435SHGFJGZUL6AWRLI7/bundle.json","state_url":"https://pith.science/pith/NSCUFH7435SHGFJGZUL6AWRLI7/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NSCUFH7435SHGFJGZUL6AWRLI7/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T12:20:27Z","links":{"resolver":"https://pith.science/pith/NSCUFH7435SHGFJGZUL6AWRLI7","bundle":"https://pith.science/pith/NSCUFH7435SHGFJGZUL6AWRLI7/bundle.json","state":"https://pith.science/pith/NSCUFH7435SHGFJGZUL6AWRLI7/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NSCUFH7435SHGFJGZUL6AWRLI7/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:NSCUFH7435SHGFJGZUL6AWRLI7","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"958cc5a060cb3d978ac13bd181e5dd8478f9ac5dd7036b0897bb654dde617d8b","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-09-23T16:02:03Z","title_canon_sha256":"1c4b747d05789a6590b84e9f81760aa611e68e9401ee2c2a51974d5d6e4ac92c"},"schema_version":"1.0","source":{"id":"1809.08621","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1809.08621","created_at":"2026-05-18T00:04:54Z"},{"alias_kind":"arxiv_version","alias_value":"1809.08621v2","created_at":"2026-05-18T00:04:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.08621","created_at":"2026-05-18T00:04:54Z"},{"alias_kind":"pith_short_12","alias_value":"NSCUFH7435SH","created_at":"2026-05-18T12:32:40Z"},{"alias_kind":"pith_short_16","alias_value":"NSCUFH7435SHGFJG","created_at":"2026-05-18T12:32:40Z"},{"alias_kind":"pith_short_8","alias_value":"NSCUFH74","created_at":"2026-05-18T12:32:40Z"}],"graph_snapshots":[{"event_id":"sha256:804bd3d2cebd906d076f4ed1c06c1405eab16818ecfa49facc8d91f929f273bf","target":"graph","created_at":"2026-05-18T00:04:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Previous research on word embeddings has shown that sparse representations, which can be either learned on top of existing dense embeddings or obtained through model constraints during training time, have the benefit of increased interpretability properties: to some degree, each dimension can be understood by a human and associated with a recognizable feature in the data. In this paper, we transfer this idea to sentence embeddings and explore several approaches to obtain a sparse representation. We further introduce a novel, quantitative and automated evaluation metric for sentence embedding i","authors_text":"Anna Potapenko, Octavian-Eugen Ganea, Thomas Hofmann, Valentin Trifonov","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-09-23T16:02:03Z","title":"Learning and Evaluating Sparse Interpretable Sentence Embeddings"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.08621","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d1fe5fa16205baf778bcc9abbf7ca57fed87473ea530c4cbe0099eb951a80687","target":"record","created_at":"2026-05-18T00:04:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"958cc5a060cb3d978ac13bd181e5dd8478f9ac5dd7036b0897bb654dde617d8b","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-09-23T16:02:03Z","title_canon_sha256":"1c4b747d05789a6590b84e9f81760aa611e68e9401ee2c2a51974d5d6e4ac92c"},"schema_version":"1.0","source":{"id":"1809.08621","kind":"arxiv","version":2}},"canonical_sha256":"6c85429ffcdf64731526cd17e05a2b47ffde81df9d3c891911fbc5f4f52a023f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6c85429ffcdf64731526cd17e05a2b47ffde81df9d3c891911fbc5f4f52a023f","first_computed_at":"2026-05-18T00:04:54.253432Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:04:54.253432Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Q03dtIWG+4oANDN6tDO3vAwe1QOJ0nO/OFlU7ZCmOAUMkOWzZDs1VruA6RCiKVpeNJzvV5Laa9b/7RP/qbRWBw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:04:54.254043Z","signed_message":"canonical_sha256_bytes"},"source_id":"1809.08621","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d1fe5fa16205baf778bcc9abbf7ca57fed87473ea530c4cbe0099eb951a80687","sha256:804bd3d2cebd906d076f4ed1c06c1405eab16818ecfa49facc8d91f929f273bf"],"state_sha256":"83ebfe98350d7820bb4fa7ac5aea3e29f7dbe6fa02f1a98b92b2789d045ee0a3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"W8hTIiqHYlum57lHuluwR7IgI3hG5UMGEhouleWSnqil8HBGlahqmjMtcbZF9sNwR2zr5mKBPsEbR72Sm06dCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T12:20:27.319959Z","bundle_sha256":"87f1803a228b60d7e64fc40dd5b665b1badbe15c0c9dc7581ca7f1f956439ca7"}}