{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2014:6KH7XFXNOUSPOZZUAEXILNEHDU","short_pith_number":"pith:6KH7XFXN","schema_version":"1.0","canonical_sha256":"f28ffb96ed7524f76734012e85b4871d0a20cbe70ea8a3d940e76ce3845b6fa8","source":{"kind":"arxiv","id":"1407.1640","version":1},"attestation_state":"computed","paper":{"title":"WordRep: A Benchmark for Research on Learning Word Representations","license":"http://creativecommons.org/licenses/by/3.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Bin Gao, Jiang Bian, Tie-Yan Liu","submitted_at":"2014-07-07T09:31:21Z","abstract_excerpt":"WordRep is a benchmark collection for the research on learning distributed word representations (or word embeddings), released by Microsoft Research. In this paper, we describe the details of the WordRep collection and show how to use it in different types of machine learning research related to word embedding. Specifically, we describe how the evaluation tasks in WordRep are selected, how the data are sampled, and how the evaluation tool is built. We then compare several state-of-the-art word representations on WordRep, report their evaluation performance, and make discussions on the results."},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1407.1640","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/3.0/","primary_cat":"cs.CL","submitted_at":"2014-07-07T09:31:21Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"24b1c9a72b5b90dc7fb5b8f6f060e498fc4987d6328a83b6d2fe6daa3edae284","abstract_canon_sha256":"94e8e35f70cb622f7f9079c4544009e989ae7cdbf2abfa59a688aca099231e64"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:48:10.840592Z","signature_b64":"OGwM9MDse9lGdWkuoy14GmMbvKG3Q/cI3EWgwlSyiQVhqFmhqRVsgBDFMs+VPSG34fU9DJnoxkt65oqOlDT6AA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f28ffb96ed7524f76734012e85b4871d0a20cbe70ea8a3d940e76ce3845b6fa8","last_reissued_at":"2026-05-18T02:48:10.839374Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:48:10.839374Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"WordRep: A Benchmark for Research on Learning Word Representations","license":"http://creativecommons.org/licenses/by/3.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.CL","authors_text":"Bin Gao, Jiang Bian, Tie-Yan Liu","submitted_at":"2014-07-07T09:31:21Z","abstract_excerpt":"WordRep is a benchmark collection for the research on learning distributed word representations (or word embeddings), released by Microsoft Research. In this paper, we describe the details of the WordRep collection and show how to use it in different types of machine learning research related to word embedding. Specifically, we describe how the evaluation tasks in WordRep are selected, how the data are sampled, and how the evaluation tool is built. We then compare several state-of-the-art word representations on WordRep, report their evaluation performance, and make discussions on the results."},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1407.1640","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1407.1640","created_at":"2026-05-18T02:48:10.840137+00:00"},{"alias_kind":"arxiv_version","alias_value":"1407.1640v1","created_at":"2026-05-18T02:48:10.840137+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1407.1640","created_at":"2026-05-18T02:48:10.840137+00:00"},{"alias_kind":"pith_short_12","alias_value":"6KH7XFXNOUSP","created_at":"2026-05-18T12:28:16.859392+00:00"},{"alias_kind":"pith_short_16","alias_value":"6KH7XFXNOUSPOZZU","created_at":"2026-05-18T12:28:16.859392+00:00"},{"alias_kind":"pith_short_8","alias_value":"6KH7XFXN","created_at":"2026-05-18T12:28:16.859392+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/6KH7XFXNOUSPOZZUAEXILNEHDU","json":"https://pith.science/pith/6KH7XFXNOUSPOZZUAEXILNEHDU.json","graph_json":"https://pith.science/api/pith-number/6KH7XFXNOUSPOZZUAEXILNEHDU/graph.json","events_json":"https://pith.science/api/pith-number/6KH7XFXNOUSPOZZUAEXILNEHDU/events.json","paper":"https://pith.science/paper/6KH7XFXN"},"agent_actions":{"view_html":"https://pith.science/pith/6KH7XFXNOUSPOZZUAEXILNEHDU","download_json":"https://pith.science/pith/6KH7XFXNOUSPOZZUAEXILNEHDU.json","view_paper":"https://pith.science/paper/6KH7XFXN","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1407.1640&json=true","fetch_graph":"https://pith.science/api/pith-number/6KH7XFXNOUSPOZZUAEXILNEHDU/graph.json","fetch_events":"https://pith.science/api/pith-number/6KH7XFXNOUSPOZZUAEXILNEHDU/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/6KH7XFXNOUSPOZZUAEXILNEHDU/action/timestamp_anchor","attest_storage":"https://pith.science/pith/6KH7XFXNOUSPOZZUAEXILNEHDU/action/storage_attestation","attest_author":"https://pith.science/pith/6KH7XFXNOUSPOZZUAEXILNEHDU/action/author_attestation","sign_citation":"https://pith.science/pith/6KH7XFXNOUSPOZZUAEXILNEHDU/action/citation_signature","submit_replication":"https://pith.science/pith/6KH7XFXNOUSPOZZUAEXILNEHDU/action/replication_record"}},"created_at":"2026-05-18T02:48:10.840137+00:00","updated_at":"2026-05-18T02:48:10.840137+00:00"}