{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:VG3E7SVYRZH5QICDAY62ZK3VSI","short_pith_number":"pith:VG3E7SVY","canonical_record":{"source":{"id":"1705.07368","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-05-20T23:45:54Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"0fd8aec34d4109061d368e2bd691308901d6d40cdfef7ac38f4e8b1ecf4bdab3","abstract_canon_sha256":"54bd88012a3a8960d57a3e1b3cc98f957a4094f28569a56ce1bfee3412e0a896"},"schema_version":"1.0"},"canonical_sha256":"a9b64fcab88e4fd82043063dacab759204d99f2c10520b7c882ab07b68471549","source":{"kind":"arxiv","id":"1705.07368","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.07368","created_at":"2026-05-18T00:22:59Z"},{"alias_kind":"arxiv_version","alias_value":"1705.07368v3","created_at":"2026-05-18T00:22:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.07368","created_at":"2026-05-18T00:22:59Z"},{"alias_kind":"pith_short_12","alias_value":"VG3E7SVYRZH5","created_at":"2026-05-18T12:31:49Z"},{"alias_kind":"pith_short_16","alias_value":"VG3E7SVYRZH5QICD","created_at":"2026-05-18T12:31:49Z"},{"alias_kind":"pith_short_8","alias_value":"VG3E7SVY","created_at":"2026-05-18T12:31:49Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:VG3E7SVYRZH5QICDAY62ZK3VSI","target":"record","payload":{"canonical_record":{"source":{"id":"1705.07368","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-05-20T23:45:54Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"0fd8aec34d4109061d368e2bd691308901d6d40cdfef7ac38f4e8b1ecf4bdab3","abstract_canon_sha256":"54bd88012a3a8960d57a3e1b3cc98f957a4094f28569a56ce1bfee3412e0a896"},"schema_version":"1.0"},"canonical_sha256":"a9b64fcab88e4fd82043063dacab759204d99f2c10520b7c882ab07b68471549","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:22:59.351330Z","signature_b64":"WZEXGlnb4orSjzYHtYUtvXZQqUZi1xRXUE06eomuDyJ0qZc+h0RvM/er4f5JMtCteORZNpdoT9F4oUrsXhK+Dg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a9b64fcab88e4fd82043063dacab759204d99f2c10520b7c882ab07b68471549","last_reissued_at":"2026-05-18T00:22:59.350820Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:22:59.350820Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1705.07368","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:22:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Wzg6hyAVb94TiMMN29aKGf3VvG5+clD4x1E1JBYAseYuGLPRYwVvMLf67mWmiegnrrvs3F4DiyJDvmPfgvTIBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-19T23:45:41.960859Z"},"content_sha256":"dee31210ba223204f2e847d9a8b3b754f7c155eb75204927783ce3b62357ee8b","schema_version":"1.0","event_id":"sha256:dee31210ba223204f2e847d9a8b3b754f7c155eb75204927783ce3b62357ee8b"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:VG3E7SVYRZH5QICDAY62ZK3VSI","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Mixed Membership Word Embeddings for Computational Social Science","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.LG"],"primary_cat":"cs.CL","authors_text":"James Foulds","submitted_at":"2017-05-20T23:45:54Z","abstract_excerpt":"Word embeddings improve the performance of NLP systems by revealing the hidden structural relationships between words. Despite their success in many applications, word embeddings have seen very little use in computational social science NLP tasks, presumably due to their reliance on big data, and to a lack of interpretability. I propose a probabilistic model-based word embedding method which can recover interpretable embeddings, without big data. The key insight is to leverage mixed membership modeling, in which global representations are shared, but individual entities (i.e. dictionary words)"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.07368","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:22:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"WS5i5LztyBhUAncndtrkoGORBFuYsdUUwoWQezSvogyAJdIQsoHpj8TPfFpDfs1QOZPTj2bKIcq+55pUubhdCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-19T23:45:41.961586Z"},"content_sha256":"e117544df0398eaa863fe5b341610aca499875432475242b75537b65e32c77fb","schema_version":"1.0","event_id":"sha256:e117544df0398eaa863fe5b341610aca499875432475242b75537b65e32c77fb"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/VG3E7SVYRZH5QICDAY62ZK3VSI/bundle.json","state_url":"https://pith.science/pith/VG3E7SVYRZH5QICDAY62ZK3VSI/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/VG3E7SVYRZH5QICDAY62ZK3VSI/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-19T23:45:41Z","links":{"resolver":"https://pith.science/pith/VG3E7SVYRZH5QICDAY62ZK3VSI","bundle":"https://pith.science/pith/VG3E7SVYRZH5QICDAY62ZK3VSI/bundle.json","state":"https://pith.science/pith/VG3E7SVYRZH5QICDAY62ZK3VSI/state.json","well_known_bundle":"https://pith.science/.well-known/pith/VG3E7SVYRZH5QICDAY62ZK3VSI/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:VG3E7SVYRZH5QICDAY62ZK3VSI","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"54bd88012a3a8960d57a3e1b3cc98f957a4094f28569a56ce1bfee3412e0a896","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-05-20T23:45:54Z","title_canon_sha256":"0fd8aec34d4109061d368e2bd691308901d6d40cdfef7ac38f4e8b1ecf4bdab3"},"schema_version":"1.0","source":{"id":"1705.07368","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.07368","created_at":"2026-05-18T00:22:59Z"},{"alias_kind":"arxiv_version","alias_value":"1705.07368v3","created_at":"2026-05-18T00:22:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.07368","created_at":"2026-05-18T00:22:59Z"},{"alias_kind":"pith_short_12","alias_value":"VG3E7SVYRZH5","created_at":"2026-05-18T12:31:49Z"},{"alias_kind":"pith_short_16","alias_value":"VG3E7SVYRZH5QICD","created_at":"2026-05-18T12:31:49Z"},{"alias_kind":"pith_short_8","alias_value":"VG3E7SVY","created_at":"2026-05-18T12:31:49Z"}],"graph_snapshots":[{"event_id":"sha256:e117544df0398eaa863fe5b341610aca499875432475242b75537b65e32c77fb","target":"graph","created_at":"2026-05-18T00:22:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Word embeddings improve the performance of NLP systems by revealing the hidden structural relationships between words. Despite their success in many applications, word embeddings have seen very little use in computational social science NLP tasks, presumably due to their reliance on big data, and to a lack of interpretability. I propose a probabilistic model-based word embedding method which can recover interpretable embeddings, without big data. The key insight is to leverage mixed membership modeling, in which global representations are shared, but individual entities (i.e. dictionary words)","authors_text":"James Foulds","cross_cats":["cs.AI","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-05-20T23:45:54Z","title":"Mixed Membership Word Embeddings for Computational Social Science"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.07368","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:dee31210ba223204f2e847d9a8b3b754f7c155eb75204927783ce3b62357ee8b","target":"record","created_at":"2026-05-18T00:22:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"54bd88012a3a8960d57a3e1b3cc98f957a4094f28569a56ce1bfee3412e0a896","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-05-20T23:45:54Z","title_canon_sha256":"0fd8aec34d4109061d368e2bd691308901d6d40cdfef7ac38f4e8b1ecf4bdab3"},"schema_version":"1.0","source":{"id":"1705.07368","kind":"arxiv","version":3}},"canonical_sha256":"a9b64fcab88e4fd82043063dacab759204d99f2c10520b7c882ab07b68471549","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a9b64fcab88e4fd82043063dacab759204d99f2c10520b7c882ab07b68471549","first_computed_at":"2026-05-18T00:22:59.350820Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:22:59.350820Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"WZEXGlnb4orSjzYHtYUtvXZQqUZi1xRXUE06eomuDyJ0qZc+h0RvM/er4f5JMtCteORZNpdoT9F4oUrsXhK+Dg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:22:59.351330Z","signed_message":"canonical_sha256_bytes"},"source_id":"1705.07368","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:dee31210ba223204f2e847d9a8b3b754f7c155eb75204927783ce3b62357ee8b","sha256:e117544df0398eaa863fe5b341610aca499875432475242b75537b65e32c77fb"],"state_sha256":"4ba546112bf7e23c31660fceed298de7a933259726fd0ecc509554a775e3f290"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"7eGwRqyPmBNJNq7JyUY+8+0fRSoj/yFdCqjpGaY1BsCKpQdIZFn+AxhUhvMqKURMtkgscxIGey9LIWfAkI+vAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-19T23:45:41.965484Z","bundle_sha256":"0ae956d12310b42f2b503c4fbfc6b307c467a55e08afde2b260c1c04e9c748f5"}}