{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:LRQMIUSHT3DEJAY4SSBYZVSWVV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"665cffb3c16dfdf6c954077ea2a37b19461d62a17857d3371e05b8db8ee8bfc7","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-04-22T16:34:30Z","title_canon_sha256":"a283193b775e748b5612714559aa38b042bd30ffa3b6719c30b0fc2b2c48e78b"},"schema_version":"1.0","source":{"id":"1604.06737","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1604.06737","created_at":"2026-05-18T01:16:28Z"},{"alias_kind":"arxiv_version","alias_value":"1604.06737v1","created_at":"2026-05-18T01:16:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.06737","created_at":"2026-05-18T01:16:28Z"},{"alias_kind":"pith_short_12","alias_value":"LRQMIUSHT3DE","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_16","alias_value":"LRQMIUSHT3DEJAY4","created_at":"2026-05-18T12:30:29Z"},{"alias_kind":"pith_short_8","alias_value":"LRQMIUSH","created_at":"2026-05-18T12:30:29Z"}],"graph_snapshots":[{"event_id":"sha256:6a1b241e08990df955d73dbfc140adfeddc34fc399ee8b51d27ad101c51b8dcb","target":"graph","created_at":"2026-05-18T01:16:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We map categorical variables in a function approximation problem into Euclidean spaces, which are the entity embeddings of the categorical variables. The mapping is learned by a neural network during the standard supervised training process. Entity embedding not only reduces memory usage and speeds up neural networks compared with one-hot encoding, but more importantly by mapping similar values close to each other in the embedding space it reveals the intrinsic properties of the categorical variables. We applied it successfully in a recent Kaggle competition and were able to reach the third po","authors_text":"Cheng Guo, Felix Berkhahn","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-04-22T16:34:30Z","title":"Entity Embeddings of Categorical Variables"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.06737","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:888c3b8da10f40f0e3d0c5d98afd7c0701bca0a2626d24bd8f36c266f4f8c814","target":"record","created_at":"2026-05-18T01:16:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"665cffb3c16dfdf6c954077ea2a37b19461d62a17857d3371e05b8db8ee8bfc7","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-04-22T16:34:30Z","title_canon_sha256":"a283193b775e748b5612714559aa38b042bd30ffa3b6719c30b0fc2b2c48e78b"},"schema_version":"1.0","source":{"id":"1604.06737","kind":"arxiv","version":1}},"canonical_sha256":"5c60c452479ec644831c94838cd656ad4e1f704644bba58689b522b7b7b0f4f3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5c60c452479ec644831c94838cd656ad4e1f704644bba58689b522b7b7b0f4f3","first_computed_at":"2026-05-18T01:16:28.287701Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:16:28.287701Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"cHRtLeuD1KaC6hUXvv7HWWXp1knqT2/Ss/MXLDOXz5o1dlx6ykALKRiDaAJjCTkoUjbYJDV961AhTPUGjiX6DA==","signature_status":"signed_v1","signed_at":"2026-05-18T01:16:28.288325Z","signed_message":"canonical_sha256_bytes"},"source_id":"1604.06737","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:888c3b8da10f40f0e3d0c5d98afd7c0701bca0a2626d24bd8f36c266f4f8c814","sha256:6a1b241e08990df955d73dbfc140adfeddc34fc399ee8b51d27ad101c51b8dcb"],"state_sha256":"2c3cdc5fd898d18ad3ce7cf4b2447b019e04a8ac0fef24e9cec27f7d5eb72080"}