{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:QQADI7SPGU3VVV7NLXNICQQAIZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7e0f9767ed6382a0bfdde667ab0bb95ea08818aa3c8158ff8aa1f7f8cf370c90","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-09-15T06:18:33Z","title_canon_sha256":"5a6dfc408a56513b76c732e28203234add7b6db3ca0e002d3e4c52457df36aa2"},"schema_version":"1.0","source":{"id":"1709.05067","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1709.05067","created_at":"2026-05-18T00:35:06Z"},{"alias_kind":"arxiv_version","alias_value":"1709.05067v1","created_at":"2026-05-18T00:35:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1709.05067","created_at":"2026-05-18T00:35:06Z"},{"alias_kind":"pith_short_12","alias_value":"QQADI7SPGU3V","created_at":"2026-05-18T12:31:39Z"},{"alias_kind":"pith_short_16","alias_value":"QQADI7SPGU3VVV7N","created_at":"2026-05-18T12:31:39Z"},{"alias_kind":"pith_short_8","alias_value":"QQADI7SP","created_at":"2026-05-18T12:31:39Z"}],"graph_snapshots":[{"event_id":"sha256:f5e81bd74a1e5c22f61727fc31abf96e478926cb08cbcffcc0b35c391b071c6b","target":"graph","created_at":"2026-05-18T00:35:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Deep reinforcement learning is revolutionizing the artificial intelligence field. Currently, it serves as a good starting point for constructing intelligent autonomous systems which offer a better knowledge of the visual world. It is possible to scale deep reinforcement learning with the use of deep learning and do amazing tasks such as use of pixels in playing video games. In this paper, key concepts of deep reinforcement learning including reward function, differences between reinforcement learning and supervised learning and models for implementation of reinforcement are discussed. Key chal","authors_text":"Agam Shah, Mahipal Jadeja, Neelanshi Varia","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-09-15T06:18:33Z","title":"Deep Reinforcement Learning for Conversational AI"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1709.05067","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a30b093fb9a5cd222017ce482f7ab8e16e9b1dce7b16467896ec2f89ed5f2082","target":"record","created_at":"2026-05-18T00:35:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7e0f9767ed6382a0bfdde667ab0bb95ea08818aa3c8158ff8aa1f7f8cf370c90","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-09-15T06:18:33Z","title_canon_sha256":"5a6dfc408a56513b76c732e28203234add7b6db3ca0e002d3e4c52457df36aa2"},"schema_version":"1.0","source":{"id":"1709.05067","kind":"arxiv","version":1}},"canonical_sha256":"8400347e4f35375ad7ed5dda814200464d0954612d672c3d613bbbc26c429dd4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8400347e4f35375ad7ed5dda814200464d0954612d672c3d613bbbc26c429dd4","first_computed_at":"2026-05-18T00:35:06.793482Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:35:06.793482Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"igJA/zqt7akArgREKrrDYGn0x+LjnNj99hEYDz3PAAaWkF3JqGyQS/vX/fpr1+dEWhI/sbExgFkRusl2ISSxCA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:35:06.794002Z","signed_message":"canonical_sha256_bytes"},"source_id":"1709.05067","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a30b093fb9a5cd222017ce482f7ab8e16e9b1dce7b16467896ec2f89ed5f2082","sha256:f5e81bd74a1e5c22f61727fc31abf96e478926cb08cbcffcc0b35c391b071c6b"],"state_sha256":"95f294edd58c41f797a7eb140445fff090bd55857a6b9283479a6849d09cc3cb"}