{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:542UXZLWD7NSC7Q7VIV4URMFKB","short_pith_number":"pith:542UXZLW","canonical_record":{"source":{"id":"1806.09614","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-25T12:06:28Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"6187d59d979fa54e6f91c73669f150ad6cc7820edbd5f809bc4704f1ace8c28a","abstract_canon_sha256":"352c2c253c263c895254acd8f017a2d4d4879f02f09d9480bed6b600b4461752"},"schema_version":"1.0"},"canonical_sha256":"ef354be5761fdb217e1faa2bca4585507848aee06a07d8b33d39e3a0a03c5247","source":{"kind":"arxiv","id":"1806.09614","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1806.09614","created_at":"2026-05-18T00:05:13Z"},{"alias_kind":"arxiv_version","alias_value":"1806.09614v2","created_at":"2026-05-18T00:05:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1806.09614","created_at":"2026-05-18T00:05:13Z"},{"alias_kind":"pith_short_12","alias_value":"542UXZLWD7NS","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_16","alias_value":"542UXZLWD7NSC7Q7","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_8","alias_value":"542UXZLW","created_at":"2026-05-18T12:32:05Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:542UXZLWD7NSC7Q7VIV4URMFKB","target":"record","payload":{"canonical_record":{"source":{"id":"1806.09614","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-25T12:06:28Z","cross_cats_sorted":["cs.AI","stat.ML"],"title_canon_sha256":"6187d59d979fa54e6f91c73669f150ad6cc7820edbd5f809bc4704f1ace8c28a","abstract_canon_sha256":"352c2c253c263c895254acd8f017a2d4d4879f02f09d9480bed6b600b4461752"},"schema_version":"1.0"},"canonical_sha256":"ef354be5761fdb217e1faa2bca4585507848aee06a07d8b33d39e3a0a03c5247","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:05:13.907915Z","signature_b64":"jaCdqyh/hcsxCa/4FKZXS5IwV17qEqlo1F+IUinaLh2X+eKo6yjZtL9rgEZ9L8rsnYTFwNJl4TpxQxHmtYUjCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"ef354be5761fdb217e1faa2bca4585507848aee06a07d8b33d39e3a0a03c5247","last_reissued_at":"2026-05-18T00:05:13.907029Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:05:13.907029Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1806.09614","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:05:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"uhyQtF8XrR+jSYw4qgrNnbUdYZ7X2U7cee20Yrj2VGbb4GxKTK49UMwBFdYFAP8UyTF9+en/3aHuXwZai3EJDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T18:51:09.231352Z"},"content_sha256":"b47c0816bcdecc8acb56c76527fb5b5a0e49956f9ac79306bad679dde9084940","schema_version":"1.0","event_id":"sha256:b47c0816bcdecc8acb56c76527fb5b5a0e49956f9ac79306bad679dde9084940"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:542UXZLWD7NSC7Q7VIV4URMFKB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Accuracy-based Curriculum Learning in Deep Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","stat.ML"],"primary_cat":"cs.LG","authors_text":"Mohamed Chetouani, Olivier Sigaud, Pierre Fournier, Pierre-Yves Oudeyer","submitted_at":"2018-06-25T12:06:28Z","abstract_excerpt":"In this paper, we investigate a new form of automated curriculum learning based on adaptive selection of accuracy requirements, called accuracy-based curriculum learning. Using a reinforcement learning agent based on the Deep Deterministic Policy Gradient algorithm and addressing the Reacher environment, we first show that an agent trained with various accuracy requirements sampled randomly learns more efficiently than when asked to be very accurate at all times. Then we show that adaptive selection of accuracy requirements, based on a local measure of competence progress, automatically genera"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1806.09614","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:05:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IR4aStDw4boDw3K5d8TXQQiid6vAfzINE7sLiR1WQt8vWfhkg7Zu7BmFFPefqkshnJgPsYwImoqXXnBhWU7YAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T18:51:09.232096Z"},"content_sha256":"289c5d5200c227146759b4668441942c042c9aa50110782cc5a42df251fb819a","schema_version":"1.0","event_id":"sha256:289c5d5200c227146759b4668441942c042c9aa50110782cc5a42df251fb819a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/542UXZLWD7NSC7Q7VIV4URMFKB/bundle.json","state_url":"https://pith.science/pith/542UXZLWD7NSC7Q7VIV4URMFKB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/542UXZLWD7NSC7Q7VIV4URMFKB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T18:51:09Z","links":{"resolver":"https://pith.science/pith/542UXZLWD7NSC7Q7VIV4URMFKB","bundle":"https://pith.science/pith/542UXZLWD7NSC7Q7VIV4URMFKB/bundle.json","state":"https://pith.science/pith/542UXZLWD7NSC7Q7VIV4URMFKB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/542UXZLWD7NSC7Q7VIV4URMFKB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:542UXZLWD7NSC7Q7VIV4URMFKB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"352c2c253c263c895254acd8f017a2d4d4879f02f09d9480bed6b600b4461752","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-25T12:06:28Z","title_canon_sha256":"6187d59d979fa54e6f91c73669f150ad6cc7820edbd5f809bc4704f1ace8c28a"},"schema_version":"1.0","source":{"id":"1806.09614","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1806.09614","created_at":"2026-05-18T00:05:13Z"},{"alias_kind":"arxiv_version","alias_value":"1806.09614v2","created_at":"2026-05-18T00:05:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1806.09614","created_at":"2026-05-18T00:05:13Z"},{"alias_kind":"pith_short_12","alias_value":"542UXZLWD7NS","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_16","alias_value":"542UXZLWD7NSC7Q7","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_8","alias_value":"542UXZLW","created_at":"2026-05-18T12:32:05Z"}],"graph_snapshots":[{"event_id":"sha256:289c5d5200c227146759b4668441942c042c9aa50110782cc5a42df251fb819a","target":"graph","created_at":"2026-05-18T00:05:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this paper, we investigate a new form of automated curriculum learning based on adaptive selection of accuracy requirements, called accuracy-based curriculum learning. Using a reinforcement learning agent based on the Deep Deterministic Policy Gradient algorithm and addressing the Reacher environment, we first show that an agent trained with various accuracy requirements sampled randomly learns more efficiently than when asked to be very accurate at all times. Then we show that adaptive selection of accuracy requirements, based on a local measure of competence progress, automatically genera","authors_text":"Mohamed Chetouani, Olivier Sigaud, Pierre Fournier, Pierre-Yves Oudeyer","cross_cats":["cs.AI","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-25T12:06:28Z","title":"Accuracy-based Curriculum Learning in Deep Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1806.09614","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b47c0816bcdecc8acb56c76527fb5b5a0e49956f9ac79306bad679dde9084940","target":"record","created_at":"2026-05-18T00:05:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"352c2c253c263c895254acd8f017a2d4d4879f02f09d9480bed6b600b4461752","cross_cats_sorted":["cs.AI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-06-25T12:06:28Z","title_canon_sha256":"6187d59d979fa54e6f91c73669f150ad6cc7820edbd5f809bc4704f1ace8c28a"},"schema_version":"1.0","source":{"id":"1806.09614","kind":"arxiv","version":2}},"canonical_sha256":"ef354be5761fdb217e1faa2bca4585507848aee06a07d8b33d39e3a0a03c5247","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"ef354be5761fdb217e1faa2bca4585507848aee06a07d8b33d39e3a0a03c5247","first_computed_at":"2026-05-18T00:05:13.907029Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:05:13.907029Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"jaCdqyh/hcsxCa/4FKZXS5IwV17qEqlo1F+IUinaLh2X+eKo6yjZtL9rgEZ9L8rsnYTFwNJl4TpxQxHmtYUjCg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:05:13.907915Z","signed_message":"canonical_sha256_bytes"},"source_id":"1806.09614","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b47c0816bcdecc8acb56c76527fb5b5a0e49956f9ac79306bad679dde9084940","sha256:289c5d5200c227146759b4668441942c042c9aa50110782cc5a42df251fb819a"],"state_sha256":"f47e0055f1133ab311d13b8d7ba5f0fca4918e0c3bbb9c93806d17b2a3ee4ac9"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hiAJrsRPed1gm2ivPQH7emHj6XNiC4HL2XVbMwBgKNxglMa1jHyClc6MmoumPkrmO49zMsU+Rov3JSq5a5oYCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T18:51:09.235402Z","bundle_sha256":"b3662f77cd6b89d0560d6e9cba456f83102bed24ebac77e795423abc152beac0"}}