{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:MY52NY7T4F4FEGK65SL6HDHLYR","short_pith_number":"pith:MY52NY7T","canonical_record":{"source":{"id":"1609.00150","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-09-01T09:00:19Z","cross_cats_sorted":[],"title_canon_sha256":"9bc3df3ebea6fc593fd8ffbfb674186e90896c4d5dca6beb636393a3efee2cdb","abstract_canon_sha256":"17373e4f70f0abbaf8048bf5c7a5f403543dc20fe2e2f2bf8a020a60834080de"},"schema_version":"1.0"},"canonical_sha256":"663ba6e3f3e17852195eec97e38cebc4601ed7ae1b049fe0bb1d947dea12c1cf","source":{"kind":"arxiv","id":"1609.00150","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1609.00150","created_at":"2026-05-18T00:53:24Z"},{"alias_kind":"arxiv_version","alias_value":"1609.00150v3","created_at":"2026-05-18T00:53:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1609.00150","created_at":"2026-05-18T00:53:24Z"},{"alias_kind":"pith_short_12","alias_value":"MY52NY7T4F4F","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_16","alias_value":"MY52NY7T4F4FEGK6","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_8","alias_value":"MY52NY7T","created_at":"2026-05-18T12:30:32Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:MY52NY7T4F4FEGK65SL6HDHLYR","target":"record","payload":{"canonical_record":{"source":{"id":"1609.00150","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-09-01T09:00:19Z","cross_cats_sorted":[],"title_canon_sha256":"9bc3df3ebea6fc593fd8ffbfb674186e90896c4d5dca6beb636393a3efee2cdb","abstract_canon_sha256":"17373e4f70f0abbaf8048bf5c7a5f403543dc20fe2e2f2bf8a020a60834080de"},"schema_version":"1.0"},"canonical_sha256":"663ba6e3f3e17852195eec97e38cebc4601ed7ae1b049fe0bb1d947dea12c1cf","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:53:24.251417Z","signature_b64":"4gpoKa8/b/brmRciGpIsKAs2PQWKAq4a9ZAVQ4aev/1E58PXME2g5E8aeo9HU5RKpqht4kKwiVsvmwT8IdwfAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"663ba6e3f3e17852195eec97e38cebc4601ed7ae1b049fe0bb1d947dea12c1cf","last_reissued_at":"2026-05-18T00:53:24.250947Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:53:24.250947Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1609.00150","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:53:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/FEKqJeNO4aFi9540P+/Z9B3VLQp4z4PvRP/mloNAQj0NeMgdpFux3qp4EuAZ0U69qXHB6qENwdCW8lNmL9tBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T23:18:29.248156Z"},"content_sha256":"baa7487d812b9ed7ff86f47f9b50e3c84dc672c4893e409ee74ee180351ef9c8","schema_version":"1.0","event_id":"sha256:baa7487d812b9ed7ff86f47f9b50e3c84dc672c4893e409ee74ee180351ef9c8"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:MY52NY7T4F4FEGK65SL6HDHLYR","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Reward Augmented Maximum Likelihood for Neural Structured Prediction","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Dale Schuurmans, Mike Schuster, Mohammad Norouzi, Navdeep Jaitly, Samy Bengio, Yonghui Wu, Zhifeng Chen","submitted_at":"2016-09-01T09:00:19Z","abstract_excerpt":"A key problem in structured output prediction is direct optimization of the task reward function that matters for test evaluation. This paper presents a simple and computationally efficient approach to incorporate task reward into a maximum likelihood framework. By establishing a link between the log-likelihood and expected reward objectives, we show that an optimal regularized expected reward is achieved when the conditional distribution of the outputs given the inputs is proportional to their exponentiated scaled rewards. Accordingly, we present a framework to smooth the predictive probabili"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1609.00150","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:53:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"dtLS099WJauAgJmp3pNM/2V6wsVMNb9dY9c2lKOJ56pamyOJ2iBij+uhG87Hd7Vd6bo3uMLi0PfMzDEHwZbwDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T23:18:29.248594Z"},"content_sha256":"fd7ad0521ec7331847e33c774cc9cd4135a797f76a8c1bc4a168e75f7f6dd54d","schema_version":"1.0","event_id":"sha256:fd7ad0521ec7331847e33c774cc9cd4135a797f76a8c1bc4a168e75f7f6dd54d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/MY52NY7T4F4FEGK65SL6HDHLYR/bundle.json","state_url":"https://pith.science/pith/MY52NY7T4F4FEGK65SL6HDHLYR/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/MY52NY7T4F4FEGK65SL6HDHLYR/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-29T23:18:29Z","links":{"resolver":"https://pith.science/pith/MY52NY7T4F4FEGK65SL6HDHLYR","bundle":"https://pith.science/pith/MY52NY7T4F4FEGK65SL6HDHLYR/bundle.json","state":"https://pith.science/pith/MY52NY7T4F4FEGK65SL6HDHLYR/state.json","well_known_bundle":"https://pith.science/.well-known/pith/MY52NY7T4F4FEGK65SL6HDHLYR/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:MY52NY7T4F4FEGK65SL6HDHLYR","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"17373e4f70f0abbaf8048bf5c7a5f403543dc20fe2e2f2bf8a020a60834080de","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-09-01T09:00:19Z","title_canon_sha256":"9bc3df3ebea6fc593fd8ffbfb674186e90896c4d5dca6beb636393a3efee2cdb"},"schema_version":"1.0","source":{"id":"1609.00150","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1609.00150","created_at":"2026-05-18T00:53:24Z"},{"alias_kind":"arxiv_version","alias_value":"1609.00150v3","created_at":"2026-05-18T00:53:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1609.00150","created_at":"2026-05-18T00:53:24Z"},{"alias_kind":"pith_short_12","alias_value":"MY52NY7T4F4F","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_16","alias_value":"MY52NY7T4F4FEGK6","created_at":"2026-05-18T12:30:32Z"},{"alias_kind":"pith_short_8","alias_value":"MY52NY7T","created_at":"2026-05-18T12:30:32Z"}],"graph_snapshots":[{"event_id":"sha256:fd7ad0521ec7331847e33c774cc9cd4135a797f76a8c1bc4a168e75f7f6dd54d","target":"graph","created_at":"2026-05-18T00:53:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"A key problem in structured output prediction is direct optimization of the task reward function that matters for test evaluation. This paper presents a simple and computationally efficient approach to incorporate task reward into a maximum likelihood framework. By establishing a link between the log-likelihood and expected reward objectives, we show that an optimal regularized expected reward is achieved when the conditional distribution of the outputs given the inputs is proportional to their exponentiated scaled rewards. Accordingly, we present a framework to smooth the predictive probabili","authors_text":"Dale Schuurmans, Mike Schuster, Mohammad Norouzi, Navdeep Jaitly, Samy Bengio, Yonghui Wu, Zhifeng Chen","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-09-01T09:00:19Z","title":"Reward Augmented Maximum Likelihood for Neural Structured Prediction"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1609.00150","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:baa7487d812b9ed7ff86f47f9b50e3c84dc672c4893e409ee74ee180351ef9c8","target":"record","created_at":"2026-05-18T00:53:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"17373e4f70f0abbaf8048bf5c7a5f403543dc20fe2e2f2bf8a020a60834080de","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-09-01T09:00:19Z","title_canon_sha256":"9bc3df3ebea6fc593fd8ffbfb674186e90896c4d5dca6beb636393a3efee2cdb"},"schema_version":"1.0","source":{"id":"1609.00150","kind":"arxiv","version":3}},"canonical_sha256":"663ba6e3f3e17852195eec97e38cebc4601ed7ae1b049fe0bb1d947dea12c1cf","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"663ba6e3f3e17852195eec97e38cebc4601ed7ae1b049fe0bb1d947dea12c1cf","first_computed_at":"2026-05-18T00:53:24.250947Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:53:24.250947Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"4gpoKa8/b/brmRciGpIsKAs2PQWKAq4a9ZAVQ4aev/1E58PXME2g5E8aeo9HU5RKpqht4kKwiVsvmwT8IdwfAA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:53:24.251417Z","signed_message":"canonical_sha256_bytes"},"source_id":"1609.00150","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:baa7487d812b9ed7ff86f47f9b50e3c84dc672c4893e409ee74ee180351ef9c8","sha256:fd7ad0521ec7331847e33c774cc9cd4135a797f76a8c1bc4a168e75f7f6dd54d"],"state_sha256":"62cf8bce37cc8eaa0710bbcb714f63c83f002c07fe360c42c0ab716f7ab9042f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yGUdAl2VmGbs+2VnI4z7boA2bbb9dgkcdJzA8hOYtqa7DNyP7rNWNw4sP6lMDuKtddZvbeEGp2gx4OujZy3eCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-29T23:18:29.250933Z","bundle_sha256":"3f7b7b0b296b683e1523859d07e3d851afb734d1544327ce86520dffa57f0ae8"}}