{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:LH2GS6VEUWYXUOIWIA7EV5OI7N","short_pith_number":"pith:LH2GS6VE","canonical_record":{"source":{"id":"1712.00006","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-30T03:40:06Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"c04847203a92848a03a350a0942a3a0380fbb08a82d85db901f10af798a61172","abstract_canon_sha256":"3001d23ea920dfe4ea0fb4b4f1e499783620c6e1a2de9ea45c8f23440a042a46"},"schema_version":"1.0"},"canonical_sha256":"59f4697aa4a5b17a3916403e4af5c8fb42265d5a0dad3c60ed5ad188ad3f521a","source":{"kind":"arxiv","id":"1712.00006","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1712.00006","created_at":"2026-05-18T00:21:50Z"},{"alias_kind":"arxiv_version","alias_value":"1712.00006v2","created_at":"2026-05-18T00:21:50Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1712.00006","created_at":"2026-05-18T00:21:50Z"},{"alias_kind":"pith_short_12","alias_value":"LH2GS6VEUWYX","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_16","alias_value":"LH2GS6VEUWYXUOIW","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_8","alias_value":"LH2GS6VE","created_at":"2026-05-18T12:31:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:LH2GS6VEUWYXUOIWIA7EV5OI7N","target":"record","payload":{"canonical_record":{"source":{"id":"1712.00006","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-30T03:40:06Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"c04847203a92848a03a350a0942a3a0380fbb08a82d85db901f10af798a61172","abstract_canon_sha256":"3001d23ea920dfe4ea0fb4b4f1e499783620c6e1a2de9ea45c8f23440a042a46"},"schema_version":"1.0"},"canonical_sha256":"59f4697aa4a5b17a3916403e4af5c8fb42265d5a0dad3c60ed5ad188ad3f521a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:21:50.741097Z","signature_b64":"fFUzIixEHOEAB0XiyhkJLtwq4z836UV/71FYrr0kqQ5nL0DLkR7AgfXgYmLFV7nEA1OBlRFL1Ccfr5ELTcehAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"59f4697aa4a5b17a3916403e4af5c8fb42265d5a0dad3c60ed5ad188ad3f521a","last_reissued_at":"2026-05-18T00:21:50.740512Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:21:50.740512Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1712.00006","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:21:50Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"MU2TTJ9hbPQizlVOPotslDPC/sEhXsG77mjHgt3cGVr3RR6UTX2XIL4IYDVZe11q/bNcL8i+qER9RljQoxquCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T11:18:07.557705Z"},"content_sha256":"67cab7794a905ea6a3d0320f13f8c8087de12b270f6aa923676ab92737e0284f","schema_version":"1.0","event_id":"sha256:67cab7794a905ea6a3d0320f13f8c8087de12b270f6aa923676ab92737e0284f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:LH2GS6VEUWYXUOIWIA7EV5OI7N","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Comparing Deep Reinforcement Learning and Evolutionary Methods in Continuous Control","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Osmar R. Zaiane, Shangtong Zhang","submitted_at":"2017-11-30T03:40:06Z","abstract_excerpt":"Reinforcement Learning and the Evolutionary Strategy are two major approaches in addressing complicated control problems. Both are strong contenders and have their own devotee communities. Both groups have been very active in developing new advances in their own domain and devising, in recent years, leading-edge techniques to address complex continuous control tasks. Here, in the context of Deep Reinforcement Learning, we formulate a parallelized version of the Proximal Policy Optimization method and a Deep Deterministic Policy Gradient method. Moreover, we conduct a thorough comparison betwee"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1712.00006","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:21:50Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"AtSXzb/RpCMAgr0bGIl/tR223Bph8RCvxGmKUi4f/q5xvKUh8gWC1CcpThxt8nUdl5WgESaDaOZ9bIoeONJ4AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T11:18:07.558263Z"},"content_sha256":"8b7deb951249a2d95d2a6fe69749d6ab6a88b679aa74d94b161e48525af81ca3","schema_version":"1.0","event_id":"sha256:8b7deb951249a2d95d2a6fe69749d6ab6a88b679aa74d94b161e48525af81ca3"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/LH2GS6VEUWYXUOIWIA7EV5OI7N/bundle.json","state_url":"https://pith.science/pith/LH2GS6VEUWYXUOIWIA7EV5OI7N/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/LH2GS6VEUWYXUOIWIA7EV5OI7N/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T11:18:07Z","links":{"resolver":"https://pith.science/pith/LH2GS6VEUWYXUOIWIA7EV5OI7N","bundle":"https://pith.science/pith/LH2GS6VEUWYXUOIWIA7EV5OI7N/bundle.json","state":"https://pith.science/pith/LH2GS6VEUWYXUOIWIA7EV5OI7N/state.json","well_known_bundle":"https://pith.science/.well-known/pith/LH2GS6VEUWYXUOIWIA7EV5OI7N/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:LH2GS6VEUWYXUOIWIA7EV5OI7N","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3001d23ea920dfe4ea0fb4b4f1e499783620c6e1a2de9ea45c8f23440a042a46","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-30T03:40:06Z","title_canon_sha256":"c04847203a92848a03a350a0942a3a0380fbb08a82d85db901f10af798a61172"},"schema_version":"1.0","source":{"id":"1712.00006","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1712.00006","created_at":"2026-05-18T00:21:50Z"},{"alias_kind":"arxiv_version","alias_value":"1712.00006v2","created_at":"2026-05-18T00:21:50Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1712.00006","created_at":"2026-05-18T00:21:50Z"},{"alias_kind":"pith_short_12","alias_value":"LH2GS6VEUWYX","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_16","alias_value":"LH2GS6VEUWYXUOIW","created_at":"2026-05-18T12:31:28Z"},{"alias_kind":"pith_short_8","alias_value":"LH2GS6VE","created_at":"2026-05-18T12:31:28Z"}],"graph_snapshots":[{"event_id":"sha256:8b7deb951249a2d95d2a6fe69749d6ab6a88b679aa74d94b161e48525af81ca3","target":"graph","created_at":"2026-05-18T00:21:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Reinforcement Learning and the Evolutionary Strategy are two major approaches in addressing complicated control problems. Both are strong contenders and have their own devotee communities. Both groups have been very active in developing new advances in their own domain and devising, in recent years, leading-edge techniques to address complex continuous control tasks. Here, in the context of Deep Reinforcement Learning, we formulate a parallelized version of the Proximal Policy Optimization method and a Deep Deterministic Policy Gradient method. Moreover, we conduct a thorough comparison betwee","authors_text":"Osmar R. Zaiane, Shangtong Zhang","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-30T03:40:06Z","title":"Comparing Deep Reinforcement Learning and Evolutionary Methods in Continuous Control"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1712.00006","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:67cab7794a905ea6a3d0320f13f8c8087de12b270f6aa923676ab92737e0284f","target":"record","created_at":"2026-05-18T00:21:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3001d23ea920dfe4ea0fb4b4f1e499783620c6e1a2de9ea45c8f23440a042a46","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2017-11-30T03:40:06Z","title_canon_sha256":"c04847203a92848a03a350a0942a3a0380fbb08a82d85db901f10af798a61172"},"schema_version":"1.0","source":{"id":"1712.00006","kind":"arxiv","version":2}},"canonical_sha256":"59f4697aa4a5b17a3916403e4af5c8fb42265d5a0dad3c60ed5ad188ad3f521a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"59f4697aa4a5b17a3916403e4af5c8fb42265d5a0dad3c60ed5ad188ad3f521a","first_computed_at":"2026-05-18T00:21:50.740512Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:21:50.740512Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"fFUzIixEHOEAB0XiyhkJLtwq4z836UV/71FYrr0kqQ5nL0DLkR7AgfXgYmLFV7nEA1OBlRFL1Ccfr5ELTcehAA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:21:50.741097Z","signed_message":"canonical_sha256_bytes"},"source_id":"1712.00006","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:67cab7794a905ea6a3d0320f13f8c8087de12b270f6aa923676ab92737e0284f","sha256:8b7deb951249a2d95d2a6fe69749d6ab6a88b679aa74d94b161e48525af81ca3"],"state_sha256":"01c03f26a0802c7ad10703bba553c6900f20dc6caae80f2e59f777a85caf7ed0"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"bpKG0CHG/OE7Ob0rb0YFi1vG2I8PXBoCbeOB85k1HIIykcX3Xjxu+gVoRFLFeOOeEMym6pyYJT33dsLbr+/pDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T11:18:07.561671Z","bundle_sha256":"397620c8b62ebb263c443b88ff020035815d22b9f975fb013614e021409d838e"}}