{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:HABAAGMK4VS3JVJRXIMM4JY76D","short_pith_number":"pith:HABAAGMK","canonical_record":{"source":{"id":"2605.24352","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-23T02:26:46Z","cross_cats_sorted":[],"title_canon_sha256":"4ba971e708c88c38d5a9c24629ee759587714b71089ce69f323f90e37b40197c","abstract_canon_sha256":"066bb27660440e25b7c09d774493968e5bc9a7d8ad8e47ed8c8a323555261fc5"},"schema_version":"1.0"},"canonical_sha256":"380200198ae565b4d531ba18ce271ff0f4c4f3ddadc0577882552a8e82272453","source":{"kind":"arxiv","id":"2605.24352","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.24352","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"arxiv_version","alias_value":"2605.24352v1","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.24352","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"pith_short_12","alias_value":"HABAAGMK4VS3","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"pith_short_16","alias_value":"HABAAGMK4VS3JVJR","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"pith_short_8","alias_value":"HABAAGMK","created_at":"2026-05-26T01:03:01Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:HABAAGMK4VS3JVJRXIMM4JY76D","target":"record","payload":{"canonical_record":{"source":{"id":"2605.24352","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-23T02:26:46Z","cross_cats_sorted":[],"title_canon_sha256":"4ba971e708c88c38d5a9c24629ee759587714b71089ce69f323f90e37b40197c","abstract_canon_sha256":"066bb27660440e25b7c09d774493968e5bc9a7d8ad8e47ed8c8a323555261fc5"},"schema_version":"1.0"},"canonical_sha256":"380200198ae565b4d531ba18ce271ff0f4c4f3ddadc0577882552a8e82272453","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-26T01:03:01.389887Z","signature_b64":"k0zgOo+kNLrY44zK4V0mcMCh5wT5uI84MkBFlXGixNFbaoo3Qf1ttaVZTHZ2PGPODVOO6NhnxbKJhCeAnLJoBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"380200198ae565b4d531ba18ce271ff0f4c4f3ddadc0577882552a8e82272453","last_reissued_at":"2026-05-26T01:03:01.389139Z","signature_status":"signed_v1","first_computed_at":"2026-05-26T01:03:01.389139Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.24352","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T01:03:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sigq9LcXY6leMgqZeNMTI42K0mieydd++zuus8sIaQCh7BW+2QtV679cFZWVTGJ0KifOGjE12sd3lH1ut8keCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T04:08:59.753199Z"},"content_sha256":"b3fc188e4d4617d36f06d467573b29a8003cf1cb7b512170a4b15d402a7a26ee","schema_version":"1.0","event_id":"sha256:b3fc188e4d4617d36f06d467573b29a8003cf1cb7b512170a4b15d402a7a26ee"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:HABAAGMK4VS3JVJRXIMM4JY76D","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Partner-Aware Hierarchical Skill Discovery for Robust Human-AI Collaboration","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Adnan Ahmad, Bahareh Nakisa, Mohammad Naim Rastgoo","submitted_at":"2026-05-23T02:26:46Z","abstract_excerpt":"Multi-agent collaboration, especially in human-AI teaming, requires agents that can adapt to novel partners with diverse and dynamic behaviors. Conventional Deep Hierarchical Reinforcement Learning (DHRL) methods focus on agent-centric rewards and overlook partner behavior, leading to shortcut learning, where skills exploit spurious information instead of adapting to partners' dynamic behaviors. This limitation undermines agents' ability to adapt and coordinate effectively with novel partners. We introduce Partner-Aware Skill Discovery (PASD), a DHRL framework that learns skills conditioned on"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.24352","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.24352/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T01:03:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"xA5C6sRg99xIAYYKs8ZBY8Q29szrnboO/5au87/1qNSiwvxMMDSl5bj5Mp+4eXl6U7ZW4AwnmEqoXWF/79GfCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T04:08:59.753614Z"},"content_sha256":"efdc0be13358d5dec220b994ed47f8a807cc38dd3ff03752d6988efe1d1d0328","schema_version":"1.0","event_id":"sha256:efdc0be13358d5dec220b994ed47f8a807cc38dd3ff03752d6988efe1d1d0328"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/HABAAGMK4VS3JVJRXIMM4JY76D/bundle.json","state_url":"https://pith.science/pith/HABAAGMK4VS3JVJRXIMM4JY76D/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/HABAAGMK4VS3JVJRXIMM4JY76D/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-01T04:08:59Z","links":{"resolver":"https://pith.science/pith/HABAAGMK4VS3JVJRXIMM4JY76D","bundle":"https://pith.science/pith/HABAAGMK4VS3JVJRXIMM4JY76D/bundle.json","state":"https://pith.science/pith/HABAAGMK4VS3JVJRXIMM4JY76D/state.json","well_known_bundle":"https://pith.science/.well-known/pith/HABAAGMK4VS3JVJRXIMM4JY76D/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:HABAAGMK4VS3JVJRXIMM4JY76D","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"066bb27660440e25b7c09d774493968e5bc9a7d8ad8e47ed8c8a323555261fc5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-23T02:26:46Z","title_canon_sha256":"4ba971e708c88c38d5a9c24629ee759587714b71089ce69f323f90e37b40197c"},"schema_version":"1.0","source":{"id":"2605.24352","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.24352","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"arxiv_version","alias_value":"2605.24352v1","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.24352","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"pith_short_12","alias_value":"HABAAGMK4VS3","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"pith_short_16","alias_value":"HABAAGMK4VS3JVJR","created_at":"2026-05-26T01:03:01Z"},{"alias_kind":"pith_short_8","alias_value":"HABAAGMK","created_at":"2026-05-26T01:03:01Z"}],"graph_snapshots":[{"event_id":"sha256:efdc0be13358d5dec220b994ed47f8a807cc38dd3ff03752d6988efe1d1d0328","target":"graph","created_at":"2026-05-26T01:03:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.24352/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Multi-agent collaboration, especially in human-AI teaming, requires agents that can adapt to novel partners with diverse and dynamic behaviors. Conventional Deep Hierarchical Reinforcement Learning (DHRL) methods focus on agent-centric rewards and overlook partner behavior, leading to shortcut learning, where skills exploit spurious information instead of adapting to partners' dynamic behaviors. This limitation undermines agents' ability to adapt and coordinate effectively with novel partners. We introduce Partner-Aware Skill Discovery (PASD), a DHRL framework that learns skills conditioned on","authors_text":"Adnan Ahmad, Bahareh Nakisa, Mohammad Naim Rastgoo","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-23T02:26:46Z","title":"Partner-Aware Hierarchical Skill Discovery for Robust Human-AI Collaboration"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.24352","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b3fc188e4d4617d36f06d467573b29a8003cf1cb7b512170a4b15d402a7a26ee","target":"record","created_at":"2026-05-26T01:03:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"066bb27660440e25b7c09d774493968e5bc9a7d8ad8e47ed8c8a323555261fc5","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-23T02:26:46Z","title_canon_sha256":"4ba971e708c88c38d5a9c24629ee759587714b71089ce69f323f90e37b40197c"},"schema_version":"1.0","source":{"id":"2605.24352","kind":"arxiv","version":1}},"canonical_sha256":"380200198ae565b4d531ba18ce271ff0f4c4f3ddadc0577882552a8e82272453","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"380200198ae565b4d531ba18ce271ff0f4c4f3ddadc0577882552a8e82272453","first_computed_at":"2026-05-26T01:03:01.389139Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-26T01:03:01.389139Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"k0zgOo+kNLrY44zK4V0mcMCh5wT5uI84MkBFlXGixNFbaoo3Qf1ttaVZTHZ2PGPODVOO6NhnxbKJhCeAnLJoBw==","signature_status":"signed_v1","signed_at":"2026-05-26T01:03:01.389887Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.24352","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b3fc188e4d4617d36f06d467573b29a8003cf1cb7b512170a4b15d402a7a26ee","sha256:efdc0be13358d5dec220b994ed47f8a807cc38dd3ff03752d6988efe1d1d0328"],"state_sha256":"d8b98996c21a4407f96d4a0f8ef33444c5d7b21f12ff5785be78aa1d810e641d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6vgW1mvKDlmW2cxGry5yIuGTNv3Ylel76cdoUSjmOCjgz2IpTuFGZs8efroYCxL3n11V2J8b04M0cMmgF+bHBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-01T04:08:59.755700Z","bundle_sha256":"45051c4a0e397c3ff7fe4e5b4983a17a4363a63d4a72b3c85660d96593eecdb2"}}