{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:MX6PVA6RR6JJKFMMW63Y52XRFK","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7828b622782106d31d159965832849e39db7a606d16e0b425a89e9e2531fe1b0","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-09-13T17:21:56Z","title_canon_sha256":"a933ddc503c5061ca23b93dd65e83cc29cfb335f71465de9599b78e50af53813"},"schema_version":"1.0","source":{"id":"1809.06227","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1809.06227","created_at":"2026-05-18T00:05:35Z"},{"alias_kind":"arxiv_version","alias_value":"1809.06227v1","created_at":"2026-05-18T00:05:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.06227","created_at":"2026-05-18T00:05:35Z"},{"alias_kind":"pith_short_12","alias_value":"MX6PVA6RR6JJ","created_at":"2026-05-18T12:32:40Z"},{"alias_kind":"pith_short_16","alias_value":"MX6PVA6RR6JJKFMM","created_at":"2026-05-18T12:32:40Z"},{"alias_kind":"pith_short_8","alias_value":"MX6PVA6R","created_at":"2026-05-18T12:32:40Z"}],"graph_snapshots":[{"event_id":"sha256:5f06c93422a12be253b1f7ecac3e6a0b250e977b7123a302fad00a260160021a","target":"graph","created_at":"2026-05-18T00:05:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Recently, Reinforcement Learning (RL) approaches have demonstrated advanced performance in image captioning by directly optimizing the metric used for testing. However, this shaped reward introduces learning biases, which reduces the readability of generated text. In addition, the large sample space makes training unstable and slow. To alleviate these issues, we propose a simple coherent solution that constrains the action space using an n-gram language prior. Quantitative and qualitative evaluations on benchmarks show that RL with the simple add-on module performs favorably against its counte","authors_text":"Kun Bai, Mo Yu, Shiyu Chang, Tszhang Guo","cross_cats":["cs.LG","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-09-13T17:21:56Z","title":"Improving Reinforcement Learning Based Image Captioning with Natural Language Prior"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.06227","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f62ddc68140ac9c9e4e2c212ced75ac05d7b56c646ac560c4f57092c1504b5f2","target":"record","created_at":"2026-05-18T00:05:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7828b622782106d31d159965832849e39db7a606d16e0b425a89e9e2531fe1b0","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-09-13T17:21:56Z","title_canon_sha256":"a933ddc503c5061ca23b93dd65e83cc29cfb335f71465de9599b78e50af53813"},"schema_version":"1.0","source":{"id":"1809.06227","kind":"arxiv","version":1}},"canonical_sha256":"65fcfa83d18f9295158cb7b78eeaf12a82c4f6b3d75f0e8c6c5e037580107b83","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"65fcfa83d18f9295158cb7b78eeaf12a82c4f6b3d75f0e8c6c5e037580107b83","first_computed_at":"2026-05-18T00:05:35.262415Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:05:35.262415Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"sm7HRWn5IFZFFwwSWr632H3lrvlZ4Z2mNEeM+gCLs+HljdYLhrnOWawWrJDtoP64m5WJE/gEac0lzM6KcZs2AA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:05:35.263377Z","signed_message":"canonical_sha256_bytes"},"source_id":"1809.06227","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f62ddc68140ac9c9e4e2c212ced75ac05d7b56c646ac560c4f57092c1504b5f2","sha256:5f06c93422a12be253b1f7ecac3e6a0b250e977b7123a302fad00a260160021a"],"state_sha256":"09899d750be80a8fe533ef753b210d451e76cc1cded1224ce41317882c93c485"}