{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:GD4QKSRHCUZSSC23IIUPXGZUW2","short_pith_number":"pith:GD4QKSRH","canonical_record":{"source":{"id":"2605.28127","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-27T08:17:01Z","cross_cats_sorted":[],"title_canon_sha256":"cfd5be0d28e4fa5f6453e860628632e11822851d6cd4afe6109f403715602807","abstract_canon_sha256":"689f3ab6bc39224b497738a3391fd8ec7855b30752db63aff993aba268ed9d01"},"schema_version":"1.0"},"canonical_sha256":"30f9054a271533290b5b4228fb9b34b6a395a16a8e1d8c060ee82cfd2c1e978e","source":{"kind":"arxiv","id":"2605.28127","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.28127","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"arxiv_version","alias_value":"2605.28127v1","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.28127","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"pith_short_12","alias_value":"GD4QKSRHCUZS","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"pith_short_16","alias_value":"GD4QKSRHCUZSSC23","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"pith_short_8","alias_value":"GD4QKSRH","created_at":"2026-05-28T01:04:59Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:GD4QKSRHCUZSSC23IIUPXGZUW2","target":"record","payload":{"canonical_record":{"source":{"id":"2605.28127","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-27T08:17:01Z","cross_cats_sorted":[],"title_canon_sha256":"cfd5be0d28e4fa5f6453e860628632e11822851d6cd4afe6109f403715602807","abstract_canon_sha256":"689f3ab6bc39224b497738a3391fd8ec7855b30752db63aff993aba268ed9d01"},"schema_version":"1.0"},"canonical_sha256":"30f9054a271533290b5b4228fb9b34b6a395a16a8e1d8c060ee82cfd2c1e978e","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-28T01:04:59.873278Z","signature_b64":"IJyKU5Mi8c7qobE1zYuYUmLja6AGTeeBoQozPT5B1km1aSRt6IZvgUaS/AHYJJCQBPezIEBtAbe5ztF6ReSlBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"30f9054a271533290b5b4228fb9b34b6a395a16a8e1d8c060ee82cfd2c1e978e","last_reissued_at":"2026-05-28T01:04:59.872850Z","signature_status":"signed_v1","first_computed_at":"2026-05-28T01:04:59.872850Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.28127","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-28T01:04:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2yug31L0GgBpqNLLGIG9JVACwns3x0835Sl+XhftIicGMjNFxS6x3/1hld2Wf8GAT15e77RFfbLDgI7cKGNICA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T06:30:56.159010Z"},"content_sha256":"3137bdde5a87de6b232d4535c6ccf96acbc6d331cf569ab417e37ee597332a09","schema_version":"1.0","event_id":"sha256:3137bdde5a87de6b232d4535c6ccf96acbc6d331cf569ab417e37ee597332a09"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:GD4QKSRHCUZSSC23IIUPXGZUW2","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Adaptive Coarse-to-Fine Subgoal Refinement for Long-Horizon Offline Goal-Conditioned Reinforcement Learning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Chao Yu, Chengdong Xu, Kaiqiang Ke, Shenghong He, Xiangyuan Lan, Yuheng Luo","submitted_at":"2026-05-27T08:17:01Z","abstract_excerpt":"Offline goal-conditioned reinforcement learning (GCRL) is challenging in long-horizon tasks, where distant state--goal pairs provide weak supervision and value estimates become vulnerable to accumulated bootstrapping errors. Hierarchical methods mitigate this difficulty by introducing intermediate subgoals, but fixed temporal abstractions or fixed hierarchy depths can be mismatched to state--goal pairs with different reachability horizons. We propose Coarse-to-Fine Hierarchical Goal Reinforcement Learning (CFHRL), a fully offline GCRL framework that adaptively refines distant goals before exec"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.28127","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.28127/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-28T01:04:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"nz+ghWbaZtO4WHb+tELQwzMabqzHN9XEavVjO5Lg+8WhogkJD3Ru9QXQVfScA/6nQv55XHQKKTnwtYolHY1dAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T06:30:56.159642Z"},"content_sha256":"6ae8c37130a85e1042d049bcb1c9ed1d817cbb4c7eb1d470930f549648d297e5","schema_version":"1.0","event_id":"sha256:6ae8c37130a85e1042d049bcb1c9ed1d817cbb4c7eb1d470930f549648d297e5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/GD4QKSRHCUZSSC23IIUPXGZUW2/bundle.json","state_url":"https://pith.science/pith/GD4QKSRHCUZSSC23IIUPXGZUW2/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/GD4QKSRHCUZSSC23IIUPXGZUW2/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T06:30:56Z","links":{"resolver":"https://pith.science/pith/GD4QKSRHCUZSSC23IIUPXGZUW2","bundle":"https://pith.science/pith/GD4QKSRHCUZSSC23IIUPXGZUW2/bundle.json","state":"https://pith.science/pith/GD4QKSRHCUZSSC23IIUPXGZUW2/state.json","well_known_bundle":"https://pith.science/.well-known/pith/GD4QKSRHCUZSSC23IIUPXGZUW2/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:GD4QKSRHCUZSSC23IIUPXGZUW2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"689f3ab6bc39224b497738a3391fd8ec7855b30752db63aff993aba268ed9d01","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-27T08:17:01Z","title_canon_sha256":"cfd5be0d28e4fa5f6453e860628632e11822851d6cd4afe6109f403715602807"},"schema_version":"1.0","source":{"id":"2605.28127","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.28127","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"arxiv_version","alias_value":"2605.28127v1","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.28127","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"pith_short_12","alias_value":"GD4QKSRHCUZS","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"pith_short_16","alias_value":"GD4QKSRHCUZSSC23","created_at":"2026-05-28T01:04:59Z"},{"alias_kind":"pith_short_8","alias_value":"GD4QKSRH","created_at":"2026-05-28T01:04:59Z"}],"graph_snapshots":[{"event_id":"sha256:6ae8c37130a85e1042d049bcb1c9ed1d817cbb4c7eb1d470930f549648d297e5","target":"graph","created_at":"2026-05-28T01:04:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.28127/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Offline goal-conditioned reinforcement learning (GCRL) is challenging in long-horizon tasks, where distant state--goal pairs provide weak supervision and value estimates become vulnerable to accumulated bootstrapping errors. Hierarchical methods mitigate this difficulty by introducing intermediate subgoals, but fixed temporal abstractions or fixed hierarchy depths can be mismatched to state--goal pairs with different reachability horizons. We propose Coarse-to-Fine Hierarchical Goal Reinforcement Learning (CFHRL), a fully offline GCRL framework that adaptively refines distant goals before exec","authors_text":"Chao Yu, Chengdong Xu, Kaiqiang Ke, Shenghong He, Xiangyuan Lan, Yuheng Luo","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-27T08:17:01Z","title":"Adaptive Coarse-to-Fine Subgoal Refinement for Long-Horizon Offline Goal-Conditioned Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.28127","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3137bdde5a87de6b232d4535c6ccf96acbc6d331cf569ab417e37ee597332a09","target":"record","created_at":"2026-05-28T01:04:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"689f3ab6bc39224b497738a3391fd8ec7855b30752db63aff993aba268ed9d01","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-27T08:17:01Z","title_canon_sha256":"cfd5be0d28e4fa5f6453e860628632e11822851d6cd4afe6109f403715602807"},"schema_version":"1.0","source":{"id":"2605.28127","kind":"arxiv","version":1}},"canonical_sha256":"30f9054a271533290b5b4228fb9b34b6a395a16a8e1d8c060ee82cfd2c1e978e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"30f9054a271533290b5b4228fb9b34b6a395a16a8e1d8c060ee82cfd2c1e978e","first_computed_at":"2026-05-28T01:04:59.872850Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-28T01:04:59.872850Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"IJyKU5Mi8c7qobE1zYuYUmLja6AGTeeBoQozPT5B1km1aSRt6IZvgUaS/AHYJJCQBPezIEBtAbe5ztF6ReSlBw==","signature_status":"signed_v1","signed_at":"2026-05-28T01:04:59.873278Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.28127","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3137bdde5a87de6b232d4535c6ccf96acbc6d331cf569ab417e37ee597332a09","sha256:6ae8c37130a85e1042d049bcb1c9ed1d817cbb4c7eb1d470930f549648d297e5"],"state_sha256":"1a882c13adc437dcf538ead47e0f1327202fbf16d0c38757be8d4b021c8e64b3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6drclnTlN+xAm32DqYLaseQT4QG/Cn2aNYvkNKKwuXFwPN3snhR+5p/kYqHXRxDHduA9KH5rgwlmglR/tVUrDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T06:30:56.162948Z","bundle_sha256":"8ca7309f3c67b2ff81fcf84fb9f1eb4a10e8364cd4469ac0aea598ddcaf2a01c"}}