{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:LRQMIUSHT3DEJAY4SSBYZVSWVV","short_pith_number":"pith:LRQMIUSH","canonical_record":{"source":{"id":"1604.06737","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-04-22T16:34:30Z","cross_cats_sorted":[],"title_canon_sha256":"a283193b775e748b5612714559aa38b042bd30ffa3b6719c30b0fc2b2c48e78b","abstract_canon_sha256":"665cffb3c16dfdf6c954077ea2a37b19461d62a17857d3371e05b8db8ee8bfc7"},"schema_version":"1.0"},"canonical_sha256":"5c60c452479ec644831c94838cd656ad4e1f704644bba58689b522b7b7b0f4f3","source":{"kind":"arxiv","id":"1604.06737","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1604.06737","created_at":"2026-05-18T01:16:28Z"},{"alias_kind":"arxiv_version","alias_value":"1604.06737v1","created_at":"2026-05-18T01:16:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.06737","created_at":"2026-05-18T01:16:28Z"},{"alias_kind":"pith_short_12","alias_value":"LRQMIUSHT3DE","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_16","alias_value":"LRQMIUSHT3DEJAY4","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_8","alias_value":"LRQMIUSH","created_at":"2026-05-18T12:30:29Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:LRQMIUSHT3DEJAY4SSBYZVSWVV","target":"record","payload":{"canonical_record":{"source":{"id":"1604.06737","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-04-22T16:34:30Z","cross_cats_sorted":[],"title_canon_sha256":"a283193b775e748b5612714559aa38b042bd30ffa3b6719c30b0fc2b2c48e78b","abstract_canon_sha256":"665cffb3c16dfdf6c954077ea2a37b19461d62a17857d3371e05b8db8ee8bfc7"},"schema_version":"1.0"},"canonical_sha256":"5c60c452479ec644831c94838cd656ad4e1f704644bba58689b522b7b7b0f4f3","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:16:28.288325Z","signature_b64":"cHRtLeuD1KaC6hUXvv7HWWXp1knqT2/Ss/MXLDOXz5o1dlx6ykALKRiDaAJjCTkoUjbYJDV961AhTPUGjiX6DA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5c60c452479ec644831c94838cd656ad4e1f704644bba58689b522b7b7b0f4f3","last_reissued_at":"2026-05-18T01:16:28.287701Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:16:28.287701Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1604.06737","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:16:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"tqbNqMIzNwsylbFmoerskkrE+weFEiBEEe/lEMwZ/zXoffXiWKxSPJHEnaehHJUpekfAkI4ysyqeoJxyp3tvCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T16:49:06.399906Z"},"content_sha256":"888c3b8da10f40f0e3d0c5d98afd7c0701bca0a2626d24bd8f36c266f4f8c814","schema_version":"1.0","event_id":"sha256:888c3b8da10f40f0e3d0c5d98afd7c0701bca0a2626d24bd8f36c266f4f8c814"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:LRQMIUSHT3DEJAY4SSBYZVSWVV","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Entity Embeddings of Categorical Variables","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Cheng Guo, Felix Berkhahn","submitted_at":"2016-04-22T16:34:30Z","abstract_excerpt":"We map categorical variables in a function approximation problem into Euclidean spaces, which are the entity embeddings of the categorical variables. The mapping is learned by a neural network during the standard supervised training process. Entity embedding not only reduces memory usage and speeds up neural networks compared with one-hot encoding, but more importantly by mapping similar values close to each other in the embedding space it reveals the intrinsic properties of the categorical variables. We applied it successfully in a recent Kaggle competition and were able to reach the third po"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.06737","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:16:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"h0I7SSMlXZ6BG12oswsg2OIIBScnINyvA5lSUujzwMfb272byGgge/wteFSEBD5YD5xYLwhuyPsWnH3crUmsBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T16:49:06.400479Z"},"content_sha256":"6a1b241e08990df955d73dbfc140adfeddc34fc399ee8b51d27ad101c51b8dcb","schema_version":"1.0","event_id":"sha256:6a1b241e08990df955d73dbfc140adfeddc34fc399ee8b51d27ad101c51b8dcb"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/LRQMIUSHT3DEJAY4SSBYZVSWVV/bundle.json","state_url":"https://pith.science/pith/LRQMIUSHT3DEJAY4SSBYZVSWVV/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/LRQMIUSHT3DEJAY4SSBYZVSWVV/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-04T16:49:06Z","links":{"resolver":"https://pith.science/pith/LRQMIUSHT3DEJAY4SSBYZVSWVV","bundle":"https://pith.science/pith/LRQMIUSHT3DEJAY4SSBYZVSWVV/bundle.json","state":"https://pith.science/pith/LRQMIUSHT3DEJAY4SSBYZVSWVV/state.json","well_known_bundle":"https://pith.science/.well-known/pith/LRQMIUSHT3DEJAY4SSBYZVSWVV/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:LRQMIUSHT3DEJAY4SSBYZVSWVV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"665cffb3c16dfdf6c954077ea2a37b19461d62a17857d3371e05b8db8ee8bfc7","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-04-22T16:34:30Z","title_canon_sha256":"a283193b775e748b5612714559aa38b042bd30ffa3b6719c30b0fc2b2c48e78b"},"schema_version":"1.0","source":{"id":"1604.06737","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1604.06737","created_at":"2026-05-18T01:16:28Z"},{"alias_kind":"arxiv_version","alias_value":"1604.06737v1","created_at":"2026-05-18T01:16:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.06737","created_at":"2026-05-18T01:16:28Z"},{"alias_kind":"pith_short_12","alias_value":"LRQMIUSHT3DE","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_16","alias_value":"LRQMIUSHT3DEJAY4","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_8","alias_value":"LRQMIUSH","created_at":"2026-05-18T12:30:29Z"}],"graph_snapshots":[{"event_id":"sha256:6a1b241e08990df955d73dbfc140adfeddc34fc399ee8b51d27ad101c51b8dcb","target":"graph","created_at":"2026-05-18T01:16:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We map categorical variables in a function approximation problem into Euclidean spaces, which are the entity embeddings of the categorical variables. The mapping is learned by a neural network during the standard supervised training process. Entity embedding not only reduces memory usage and speeds up neural networks compared with one-hot encoding, but more importantly by mapping similar values close to each other in the embedding space it reveals the intrinsic properties of the categorical variables. We applied it successfully in a recent Kaggle competition and were able to reach the third po","authors_text":"Cheng Guo, Felix Berkhahn","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-04-22T16:34:30Z","title":"Entity Embeddings of Categorical Variables"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.06737","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:888c3b8da10f40f0e3d0c5d98afd7c0701bca0a2626d24bd8f36c266f4f8c814","target":"record","created_at":"2026-05-18T01:16:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"665cffb3c16dfdf6c954077ea2a37b19461d62a17857d3371e05b8db8ee8bfc7","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-04-22T16:34:30Z","title_canon_sha256":"a283193b775e748b5612714559aa38b042bd30ffa3b6719c30b0fc2b2c48e78b"},"schema_version":"1.0","source":{"id":"1604.06737","kind":"arxiv","version":1}},"canonical_sha256":"5c60c452479ec644831c94838cd656ad4e1f704644bba58689b522b7b7b0f4f3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5c60c452479ec644831c94838cd656ad4e1f704644bba58689b522b7b7b0f4f3","first_computed_at":"2026-05-18T01:16:28.287701Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:16:28.287701Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"cHRtLeuD1KaC6hUXvv7HWWXp1knqT2/Ss/MXLDOXz5o1dlx6ykALKRiDaAJjCTkoUjbYJDV961AhTPUGjiX6DA==","signature_status":"signed_v1","signed_at":"2026-05-18T01:16:28.288325Z","signed_message":"canonical_sha256_bytes"},"source_id":"1604.06737","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:888c3b8da10f40f0e3d0c5d98afd7c0701bca0a2626d24bd8f36c266f4f8c814","sha256:6a1b241e08990df955d73dbfc140adfeddc34fc399ee8b51d27ad101c51b8dcb"],"state_sha256":"2c3cdc5fd898d18ad3ce7cf4b2447b019e04a8ac0fef24e9cec27f7d5eb72080"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"DJH3NZhclXtbF+GL/B1cfF703TPj1e83xPvsNMr9WmT/u799BtL4318fAAHWtDjpXPL0BUvBL7G3bxxxi5V/Bw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-04T16:49:06.404524Z","bundle_sha256":"e3b584f6f4d845e924b28982acfc60c8b8b8869acc79f490167c84c69030d133"}}