{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:R2EN443B4V5EKAOMJHEAJ3Q5RP","short_pith_number":"pith:R2EN443B","canonical_record":{"source":{"id":"1703.02239","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-03-07T06:51:19Z","cross_cats_sorted":[],"title_canon_sha256":"aec34bd16f71e227825c0a18c01fb24c95c78423367a6b148f32a15712c6f015","abstract_canon_sha256":"47dee670c55e3764758289ff5cf3a07f86f3b4b398a18a47e9ecbcaefe576d56"},"schema_version":"1.0"},"canonical_sha256":"8e88de7361e57a4501cc49c804ee1d8bc2566ca637cf7f8adc3a170b2b57d6ce","source":{"kind":"arxiv","id":"1703.02239","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.02239","created_at":"2026-05-18T00:44:23Z"},{"alias_kind":"arxiv_version","alias_value":"1703.02239v2","created_at":"2026-05-18T00:44:23Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.02239","created_at":"2026-05-18T00:44:23Z"},{"alias_kind":"pith_short_12","alias_value":"R2EN443B4V5E","created_at":"2026-05-18T12:31:39Z"},{"alias_kind":"pith_short_16","alias_value":"R2EN443B4V5EKAOM","created_at":"2026-05-18T12:31:39Z"},{"alias_kind":"pith_short_8","alias_value":"R2EN443B","created_at":"2026-05-18T12:31:39Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:R2EN443B4V5EKAOMJHEAJ3Q5RP","target":"record","payload":{"canonical_record":{"source":{"id":"1703.02239","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-03-07T06:51:19Z","cross_cats_sorted":[],"title_canon_sha256":"aec34bd16f71e227825c0a18c01fb24c95c78423367a6b148f32a15712c6f015","abstract_canon_sha256":"47dee670c55e3764758289ff5cf3a07f86f3b4b398a18a47e9ecbcaefe576d56"},"schema_version":"1.0"},"canonical_sha256":"8e88de7361e57a4501cc49c804ee1d8bc2566ca637cf7f8adc3a170b2b57d6ce","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:44:23.340795Z","signature_b64":"20zr0ztLnoC8lfgTZp7Egow6t5qYd04bf3SPROYzORf68INkkP0NrLftTlzcYgqt38VN/QD8OqffMVArS1z9Bw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8e88de7361e57a4501cc49c804ee1d8bc2566ca637cf7f8adc3a170b2b57d6ce","last_reissued_at":"2026-05-18T00:44:23.340337Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:44:23.340337Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1703.02239","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:44:23Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"fiHlUFJKF9Djv9uySYq0sejERLztxaDrAjiO2/r7D5y0qvQwzk9pVx4rFMAKfgYMI5Uvc1Jje+CKegENOuTSCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T07:32:43.396854Z"},"content_sha256":"c5b19ff32e839f2a4f515d038a9e120262af094e745fb6ce60daf58e74ec77a5","schema_version":"1.0","event_id":"sha256:c5b19ff32e839f2a4f515d038a9e120262af094e745fb6ce60daf58e74ec77a5"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:R2EN443B4V5EKAOMJHEAJ3Q5RP","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Functions that Emerge through End-to-End Reinforcement Learning - The Direction for Artificial General Intelligence -","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Katsunari Shibata","submitted_at":"2017-03-07T06:51:19Z","abstract_excerpt":"Recently, triggered by the impressive results in TV-games or game of Go by Google DeepMind, end-to-end reinforcement learning (RL) is collecting attentions. Although little is known, the author's group has propounded this framework for around 20 years and already has shown various functions that emerge in a neural network (NN) through RL. In this paper, they are introduced again at this timing.\n  \"Function Modularization\" approach is deeply penetrated subconsciously. The inputs and outputs for a learning system can be raw sensor signals and motor commands. \"State space\" or \"action space\" gener"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.02239","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:44:23Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ZFIK8wlx54YRocFrVxqbx0RhYrcC1m7jWD36YW+9E78dtGU0NuAHu+bSrM/VLqT67owXv1nS0XKgCaoR3UhFBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T07:32:43.397492Z"},"content_sha256":"2cd0808ed2facddd428546feff9b1567700cdd89dd479f30a3523158a97ae524","schema_version":"1.0","event_id":"sha256:2cd0808ed2facddd428546feff9b1567700cdd89dd479f30a3523158a97ae524"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/R2EN443B4V5EKAOMJHEAJ3Q5RP/bundle.json","state_url":"https://pith.science/pith/R2EN443B4V5EKAOMJHEAJ3Q5RP/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/R2EN443B4V5EKAOMJHEAJ3Q5RP/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-02T07:32:43Z","links":{"resolver":"https://pith.science/pith/R2EN443B4V5EKAOMJHEAJ3Q5RP","bundle":"https://pith.science/pith/R2EN443B4V5EKAOMJHEAJ3Q5RP/bundle.json","state":"https://pith.science/pith/R2EN443B4V5EKAOMJHEAJ3Q5RP/state.json","well_known_bundle":"https://pith.science/.well-known/pith/R2EN443B4V5EKAOMJHEAJ3Q5RP/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:R2EN443B4V5EKAOMJHEAJ3Q5RP","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"47dee670c55e3764758289ff5cf3a07f86f3b4b398a18a47e9ecbcaefe576d56","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-03-07T06:51:19Z","title_canon_sha256":"aec34bd16f71e227825c0a18c01fb24c95c78423367a6b148f32a15712c6f015"},"schema_version":"1.0","source":{"id":"1703.02239","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.02239","created_at":"2026-05-18T00:44:23Z"},{"alias_kind":"arxiv_version","alias_value":"1703.02239v2","created_at":"2026-05-18T00:44:23Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.02239","created_at":"2026-05-18T00:44:23Z"},{"alias_kind":"pith_short_12","alias_value":"R2EN443B4V5E","created_at":"2026-05-18T12:31:39Z"},{"alias_kind":"pith_short_16","alias_value":"R2EN443B4V5EKAOM","created_at":"2026-05-18T12:31:39Z"},{"alias_kind":"pith_short_8","alias_value":"R2EN443B","created_at":"2026-05-18T12:31:39Z"}],"graph_snapshots":[{"event_id":"sha256:2cd0808ed2facddd428546feff9b1567700cdd89dd479f30a3523158a97ae524","target":"graph","created_at":"2026-05-18T00:44:23Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Recently, triggered by the impressive results in TV-games or game of Go by Google DeepMind, end-to-end reinforcement learning (RL) is collecting attentions. Although little is known, the author's group has propounded this framework for around 20 years and already has shown various functions that emerge in a neural network (NN) through RL. In this paper, they are introduced again at this timing.\n  \"Function Modularization\" approach is deeply penetrated subconsciously. The inputs and outputs for a learning system can be raw sensor signals and motor commands. \"State space\" or \"action space\" gener","authors_text":"Katsunari Shibata","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-03-07T06:51:19Z","title":"Functions that Emerge through End-to-End Reinforcement Learning - The Direction for Artificial General Intelligence -"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.02239","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c5b19ff32e839f2a4f515d038a9e120262af094e745fb6ce60daf58e74ec77a5","target":"record","created_at":"2026-05-18T00:44:23Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"47dee670c55e3764758289ff5cf3a07f86f3b4b398a18a47e9ecbcaefe576d56","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-03-07T06:51:19Z","title_canon_sha256":"aec34bd16f71e227825c0a18c01fb24c95c78423367a6b148f32a15712c6f015"},"schema_version":"1.0","source":{"id":"1703.02239","kind":"arxiv","version":2}},"canonical_sha256":"8e88de7361e57a4501cc49c804ee1d8bc2566ca637cf7f8adc3a170b2b57d6ce","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8e88de7361e57a4501cc49c804ee1d8bc2566ca637cf7f8adc3a170b2b57d6ce","first_computed_at":"2026-05-18T00:44:23.340337Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:44:23.340337Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"20zr0ztLnoC8lfgTZp7Egow6t5qYd04bf3SPROYzORf68INkkP0NrLftTlzcYgqt38VN/QD8OqffMVArS1z9Bw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:44:23.340795Z","signed_message":"canonical_sha256_bytes"},"source_id":"1703.02239","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c5b19ff32e839f2a4f515d038a9e120262af094e745fb6ce60daf58e74ec77a5","sha256:2cd0808ed2facddd428546feff9b1567700cdd89dd479f30a3523158a97ae524"],"state_sha256":"650c645039e243940cd5d691a899f59b1916f7e65c291f2e430de919904f889a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"GSIRI2ls3x5GiHWH0k19L65+VTksMOBuSucc+ZHnQdoXCSaU176m6pdkZXYfXY1G/1RzHnvztmWLa7//bK6sDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-02T07:32:43.401016Z","bundle_sha256":"b2ba63b21457de555e76b16ba3df9de1b237e43156a4c1e72c395020d134974a"}}