{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:CXECS5QE62BM266WAFE3DNFFYN","short_pith_number":"pith:CXECS5QE","canonical_record":{"source":{"id":"1807.02371","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-06T12:08:53Z","cross_cats_sorted":["cs.RO"],"title_canon_sha256":"b5344ed9a1293f752846997836a6005488aa23068439c954db6ca4f3dabfb328","abstract_canon_sha256":"0a286bdd98e61a16f12a22dc63d694459da45d01d6ecf7593cca59dfdfcbbbb0"},"schema_version":"1.0"},"canonical_sha256":"15c8297604f682cd7bd60149b1b4a5c34cfe469be4f8ca8cf332fa0f4ceceb0b","source":{"kind":"arxiv","id":"1807.02371","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1807.02371","created_at":"2026-05-18T00:06:45Z"},{"alias_kind":"arxiv_version","alias_value":"1807.02371v2","created_at":"2026-05-18T00:06:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1807.02371","created_at":"2026-05-18T00:06:45Z"},{"alias_kind":"pith_short_12","alias_value":"CXECS5QE62BM","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_16","alias_value":"CXECS5QE62BM266W","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_8","alias_value":"CXECS5QE","created_at":"2026-05-18T12:32:19Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:CXECS5QE62BM266WAFE3DNFFYN","target":"record","payload":{"canonical_record":{"source":{"id":"1807.02371","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-06T12:08:53Z","cross_cats_sorted":["cs.RO"],"title_canon_sha256":"b5344ed9a1293f752846997836a6005488aa23068439c954db6ca4f3dabfb328","abstract_canon_sha256":"0a286bdd98e61a16f12a22dc63d694459da45d01d6ecf7593cca59dfdfcbbbb0"},"schema_version":"1.0"},"canonical_sha256":"15c8297604f682cd7bd60149b1b4a5c34cfe469be4f8ca8cf332fa0f4ceceb0b","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:06:45.841981Z","signature_b64":"RH9p3O+AcpYJO5nkNNogRGJGvckmVqtFGrK+Dt2sfLzolPsx+DSN7r7cYiFKC6xxbgUdFvHlYltFGOABgZWKCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"15c8297604f682cd7bd60149b1b4a5c34cfe469be4f8ca8cf332fa0f4ceceb0b","last_reissued_at":"2026-05-18T00:06:45.841371Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:06:45.841371Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1807.02371","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:06:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"a2PWxEHC3V8l4IOPWZENCgRFJGRO8sXmy+8WKfHR85j+8hTMbNE9y6neD+qiLnTkWNEVU4hAouUjsBYPZKkiCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T13:03:21.739903Z"},"content_sha256":"3282d75798bce8e969102bcafc138915e1640dd1a0e7bdbde01047e0abc0660a","schema_version":"1.0","event_id":"sha256:3282d75798bce8e969102bcafc138915e1640dd1a0e7bdbde01047e0abc0660a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:CXECS5QE62BM266WAFE3DNFFYN","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"End-to-End Race Driving with Deep Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.RO"],"primary_cat":"cs.CV","authors_text":"Etienne Perot, Fawzi Nashashibi, Marin Toromanoff, Maximilian Jaritz, Raoul de Charette","submitted_at":"2018-07-06T12:08:53Z","abstract_excerpt":"We present research using the latest reinforcement learning algorithm for end-to-end driving without any mediated perception (object recognition, scene understanding). The newly proposed reward and learning strategies lead together to faster convergence and more robust driving using only RGB image from a forward facing camera. An Asynchronous Actor Critic (A3C) framework is used to learn the car control in a physically and graphically realistic rally game, with the agents evolving simultaneously on tracks with a variety of road structures (turns, hills), graphics (seasons, location) and physic"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1807.02371","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:06:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kmjoUdXxztCPAW8PBX35alF+GydMI1ZA9LvCIiMQWkmcx6yGQv8Ya4cTwZFWOS/iKwQ1zxb/DcnyOlh5H19CAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T13:03:21.740332Z"},"content_sha256":"9d6ac11849c5461b1592547a4b463153a0f6dbb2163a443ff81805806f849992","schema_version":"1.0","event_id":"sha256:9d6ac11849c5461b1592547a4b463153a0f6dbb2163a443ff81805806f849992"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/CXECS5QE62BM266WAFE3DNFFYN/bundle.json","state_url":"https://pith.science/pith/CXECS5QE62BM266WAFE3DNFFYN/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/CXECS5QE62BM266WAFE3DNFFYN/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T13:03:21Z","links":{"resolver":"https://pith.science/pith/CXECS5QE62BM266WAFE3DNFFYN","bundle":"https://pith.science/pith/CXECS5QE62BM266WAFE3DNFFYN/bundle.json","state":"https://pith.science/pith/CXECS5QE62BM266WAFE3DNFFYN/state.json","well_known_bundle":"https://pith.science/.well-known/pith/CXECS5QE62BM266WAFE3DNFFYN/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:CXECS5QE62BM266WAFE3DNFFYN","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0a286bdd98e61a16f12a22dc63d694459da45d01d6ecf7593cca59dfdfcbbbb0","cross_cats_sorted":["cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-06T12:08:53Z","title_canon_sha256":"b5344ed9a1293f752846997836a6005488aa23068439c954db6ca4f3dabfb328"},"schema_version":"1.0","source":{"id":"1807.02371","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1807.02371","created_at":"2026-05-18T00:06:45Z"},{"alias_kind":"arxiv_version","alias_value":"1807.02371v2","created_at":"2026-05-18T00:06:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1807.02371","created_at":"2026-05-18T00:06:45Z"},{"alias_kind":"pith_short_12","alias_value":"CXECS5QE62BM","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_16","alias_value":"CXECS5QE62BM266W","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_8","alias_value":"CXECS5QE","created_at":"2026-05-18T12:32:19Z"}],"graph_snapshots":[{"event_id":"sha256:9d6ac11849c5461b1592547a4b463153a0f6dbb2163a443ff81805806f849992","target":"graph","created_at":"2026-05-18T00:06:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We present research using the latest reinforcement learning algorithm for end-to-end driving without any mediated perception (object recognition, scene understanding). The newly proposed reward and learning strategies lead together to faster convergence and more robust driving using only RGB image from a forward facing camera. An Asynchronous Actor Critic (A3C) framework is used to learn the car control in a physically and graphically realistic rally game, with the agents evolving simultaneously on tracks with a variety of road structures (turns, hills), graphics (seasons, location) and physic","authors_text":"Etienne Perot, Fawzi Nashashibi, Marin Toromanoff, Maximilian Jaritz, Raoul de Charette","cross_cats":["cs.RO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-06T12:08:53Z","title":"End-to-End Race Driving with Deep Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1807.02371","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3282d75798bce8e969102bcafc138915e1640dd1a0e7bdbde01047e0abc0660a","target":"record","created_at":"2026-05-18T00:06:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0a286bdd98e61a16f12a22dc63d694459da45d01d6ecf7593cca59dfdfcbbbb0","cross_cats_sorted":["cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-06T12:08:53Z","title_canon_sha256":"b5344ed9a1293f752846997836a6005488aa23068439c954db6ca4f3dabfb328"},"schema_version":"1.0","source":{"id":"1807.02371","kind":"arxiv","version":2}},"canonical_sha256":"15c8297604f682cd7bd60149b1b4a5c34cfe469be4f8ca8cf332fa0f4ceceb0b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"15c8297604f682cd7bd60149b1b4a5c34cfe469be4f8ca8cf332fa0f4ceceb0b","first_computed_at":"2026-05-18T00:06:45.841371Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:06:45.841371Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"RH9p3O+AcpYJO5nkNNogRGJGvckmVqtFGrK+Dt2sfLzolPsx+DSN7r7cYiFKC6xxbgUdFvHlYltFGOABgZWKCA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:06:45.841981Z","signed_message":"canonical_sha256_bytes"},"source_id":"1807.02371","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3282d75798bce8e969102bcafc138915e1640dd1a0e7bdbde01047e0abc0660a","sha256:9d6ac11849c5461b1592547a4b463153a0f6dbb2163a443ff81805806f849992"],"state_sha256":"b041ea1b07a22d7afa7128eb207d2f4eb14986f1d47822cfaf01f8fa0e3bfc9e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"O56UA8QAzVKzyqzsofcDicDWYnDN08bxYKjB16tn4Medc//B51BSXxxML23UJLkVoeV879Rd6BT68Km0ZLuFAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T13:03:21.743865Z","bundle_sha256":"1411bf5443b9308f1509a6ea632c9821acb13665d55faaccf802a51970f4fc26"}}