{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:YEBPGJVQ3ATKLN5Y2KGH5SX7UQ","short_pith_number":"pith:YEBPGJVQ","canonical_record":{"source":{"id":"1508.07709","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-08-31T07:52:50Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"74d5ed6993dc50d65a5344e34575f8d06c5078d355d18b10a6cb12bf6942a5b2","abstract_canon_sha256":"10d71ea217e9c97ae8ff5fdf48d533325a1174e01017b5a7a31602beda02648d"},"schema_version":"1.0"},"canonical_sha256":"c102f326b0d826a5b7b8d28c7ecaffa40a647d563b476c7bb86ff85a0f74c0ba","source":{"kind":"arxiv","id":"1508.07709","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1508.07709","created_at":"2026-05-18T01:21:15Z"},{"alias_kind":"arxiv_version","alias_value":"1508.07709v2","created_at":"2026-05-18T01:21:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1508.07709","created_at":"2026-05-18T01:21:15Z"},{"alias_kind":"pith_short_12","alias_value":"YEBPGJVQ3ATK","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_16","alias_value":"YEBPGJVQ3ATKLN5Y","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_8","alias_value":"YEBPGJVQ","created_at":"2026-05-18T12:29:50Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:YEBPGJVQ3ATKLN5Y2KGH5SX7UQ","target":"record","payload":{"canonical_record":{"source":{"id":"1508.07709","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-08-31T07:52:50Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"74d5ed6993dc50d65a5344e34575f8d06c5078d355d18b10a6cb12bf6942a5b2","abstract_canon_sha256":"10d71ea217e9c97ae8ff5fdf48d533325a1174e01017b5a7a31602beda02648d"},"schema_version":"1.0"},"canonical_sha256":"c102f326b0d826a5b7b8d28c7ecaffa40a647d563b476c7bb86ff85a0f74c0ba","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:21:15.741216Z","signature_b64":"w7KWNNG1/Ihw+tUXk3FIiYoTXC/OXtyhEIFTOhUsElna/jEYEwd6Y6XHocGtaJQ7F/Q0E155bSUq944yjndNCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c102f326b0d826a5b7b8d28c7ecaffa40a647d563b476c7bb86ff85a0f74c0ba","last_reissued_at":"2026-05-18T01:21:15.740537Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:21:15.740537Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1508.07709","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:21:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ovQT84C8h9CF6GgkA7QS01/uSADbKXyhTjQI+r9qQAvavpXLU7a7Ce76wQi2vL7VsUglOpKmfUniSRMpxSuGDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T10:38:54.286327Z"},"content_sha256":"ba81423e58ac56abc92869ac36c735868e2fc8ea018d846a49df883e5646cf28","schema_version":"1.0","event_id":"sha256:ba81423e58ac56abc92869ac36c735868e2fc8ea018d846a49df883e5646cf28"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:YEBPGJVQ3ATKLN5Y2KGH5SX7UQ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Word Representations, Tree Models and Syntactic Functions","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","stat.ML"],"primary_cat":"cs.CL","authors_text":"Gertjan van Noord, Ivan Titov, Simon \\v{S}uster","submitted_at":"2015-08-31T07:52:50Z","abstract_excerpt":"Word representations induced from models with discrete latent variables (e.g.\\ HMMs) have been shown to be beneficial in many NLP applications. In this work, we exploit labeled syntactic dependency trees and formalize the induction problem as unsupervised learning of tree-structured hidden Markov models. Syntactic functions are used as additional observed variables in the model, influencing both transition and emission components. Such syntactic information can potentially lead to capturing more fine-grain and functional distinctions between words, which, in turn, may be desirable in many NLP "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1508.07709","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:21:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"frHrU/hFFDGd6WHsoTIM4UErUgJu06qzVDu6S3qRQKqC/Srvttlg18sEXF4bCTyB2qEkSq60mEjdJItUbnnxAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-04T10:38:54.286687Z"},"content_sha256":"d8f137f824579c85ec9d724e8c7c8b97960088e302ff1f3d8a76bb05900ba630","schema_version":"1.0","event_id":"sha256:d8f137f824579c85ec9d724e8c7c8b97960088e302ff1f3d8a76bb05900ba630"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/YEBPGJVQ3ATKLN5Y2KGH5SX7UQ/bundle.json","state_url":"https://pith.science/pith/YEBPGJVQ3ATKLN5Y2KGH5SX7UQ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/YEBPGJVQ3ATKLN5Y2KGH5SX7UQ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-04T10:38:54Z","links":{"resolver":"https://pith.science/pith/YEBPGJVQ3ATKLN5Y2KGH5SX7UQ","bundle":"https://pith.science/pith/YEBPGJVQ3ATKLN5Y2KGH5SX7UQ/bundle.json","state":"https://pith.science/pith/YEBPGJVQ3ATKLN5Y2KGH5SX7UQ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/YEBPGJVQ3ATKLN5Y2KGH5SX7UQ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:YEBPGJVQ3ATKLN5Y2KGH5SX7UQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"10d71ea217e9c97ae8ff5fdf48d533325a1174e01017b5a7a31602beda02648d","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-08-31T07:52:50Z","title_canon_sha256":"74d5ed6993dc50d65a5344e34575f8d06c5078d355d18b10a6cb12bf6942a5b2"},"schema_version":"1.0","source":{"id":"1508.07709","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1508.07709","created_at":"2026-05-18T01:21:15Z"},{"alias_kind":"arxiv_version","alias_value":"1508.07709v2","created_at":"2026-05-18T01:21:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1508.07709","created_at":"2026-05-18T01:21:15Z"},{"alias_kind":"pith_short_12","alias_value":"YEBPGJVQ3ATK","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_16","alias_value":"YEBPGJVQ3ATKLN5Y","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_8","alias_value":"YEBPGJVQ","created_at":"2026-05-18T12:29:50Z"}],"graph_snapshots":[{"event_id":"sha256:d8f137f824579c85ec9d724e8c7c8b97960088e302ff1f3d8a76bb05900ba630","target":"graph","created_at":"2026-05-18T01:21:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Word representations induced from models with discrete latent variables (e.g.\\ HMMs) have been shown to be beneficial in many NLP applications. In this work, we exploit labeled syntactic dependency trees and formalize the induction problem as unsupervised learning of tree-structured hidden Markov models. Syntactic functions are used as additional observed variables in the model, influencing both transition and emission components. Such syntactic information can potentially lead to capturing more fine-grain and functional distinctions between words, which, in turn, may be desirable in many NLP ","authors_text":"Gertjan van Noord, Ivan Titov, Simon \\v{S}uster","cross_cats":["cs.LG","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-08-31T07:52:50Z","title":"Word Representations, Tree Models and Syntactic Functions"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1508.07709","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ba81423e58ac56abc92869ac36c735868e2fc8ea018d846a49df883e5646cf28","target":"record","created_at":"2026-05-18T01:21:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"10d71ea217e9c97ae8ff5fdf48d533325a1174e01017b5a7a31602beda02648d","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2015-08-31T07:52:50Z","title_canon_sha256":"74d5ed6993dc50d65a5344e34575f8d06c5078d355d18b10a6cb12bf6942a5b2"},"schema_version":"1.0","source":{"id":"1508.07709","kind":"arxiv","version":2}},"canonical_sha256":"c102f326b0d826a5b7b8d28c7ecaffa40a647d563b476c7bb86ff85a0f74c0ba","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c102f326b0d826a5b7b8d28c7ecaffa40a647d563b476c7bb86ff85a0f74c0ba","first_computed_at":"2026-05-18T01:21:15.740537Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:21:15.740537Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"w7KWNNG1/Ihw+tUXk3FIiYoTXC/OXtyhEIFTOhUsElna/jEYEwd6Y6XHocGtaJQ7F/Q0E155bSUq944yjndNCg==","signature_status":"signed_v1","signed_at":"2026-05-18T01:21:15.741216Z","signed_message":"canonical_sha256_bytes"},"source_id":"1508.07709","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ba81423e58ac56abc92869ac36c735868e2fc8ea018d846a49df883e5646cf28","sha256:d8f137f824579c85ec9d724e8c7c8b97960088e302ff1f3d8a76bb05900ba630"],"state_sha256":"f3a4159e1e43b39cccefc94b5512c8fe189c620aae2971322aa4a26b9b75346b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+LO2kdLdgPzEhJeWshuS6oUybem2lQ9XOsuZuiu9TYAUEH+kuRBDTniza74h9ZYVoQW7GSDrxu/9Shg9QLbkCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-04T10:38:54.288576Z","bundle_sha256":"b16fbeaee87502016e7cae62ca17d48c543ba2be28c35bed85965d175ca017f6"}}