{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:3KG7BQQY5E5OTE5KRLOBZHUD3V","short_pith_number":"pith:3KG7BQQY","canonical_record":{"source":{"id":"1805.08010","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-21T12:15:34Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"478e1b63d277c1a150a7266a4243d4d137e3167aa906b6867f70f195d5959a36","abstract_canon_sha256":"4202523564616cd6983a94f42e1abd8f87d524d08ce20d2cd9d92c299f7a835d"},"schema_version":"1.0"},"canonical_sha256":"da8df0c218e93ae993aa8adc1c9e83dd4f1232ef8d4a23f26adbab3a6d292f01","source":{"kind":"arxiv","id":"1805.08010","version":4},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.08010","created_at":"2026-05-17T23:56:53Z"},{"alias_kind":"arxiv_version","alias_value":"1805.08010v4","created_at":"2026-05-17T23:56:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.08010","created_at":"2026-05-17T23:56:53Z"},{"alias_kind":"pith_short_12","alias_value":"3KG7BQQY5E5O","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_16","alias_value":"3KG7BQQY5E5OTE5K","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_8","alias_value":"3KG7BQQY","created_at":"2026-05-18T12:32:02Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:3KG7BQQY5E5OTE5KRLOBZHUD3V","target":"record","payload":{"canonical_record":{"source":{"id":"1805.08010","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-21T12:15:34Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"478e1b63d277c1a150a7266a4243d4d137e3167aa906b6867f70f195d5959a36","abstract_canon_sha256":"4202523564616cd6983a94f42e1abd8f87d524d08ce20d2cd9d92c299f7a835d"},"schema_version":"1.0"},"canonical_sha256":"da8df0c218e93ae993aa8adc1c9e83dd4f1232ef8d4a23f26adbab3a6d292f01","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:56:53.370644Z","signature_b64":"kHNQl0kaVlrcZQRb+p2//R4SyMSJ47M/aiujhPqSrEz1iBmGvqOxXJ+VJKtZJLszu8uO9n1Dq2HH9+duBkP7Cg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"da8df0c218e93ae993aa8adc1c9e83dd4f1232ef8d4a23f26adbab3a6d292f01","last_reissued_at":"2026-05-17T23:56:53.369871Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:56:53.369871Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1805.08010","source_version":4,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IIXz0ANWfy7XMPBb0VmRGzJ6jCQ9uq1Wjx3jXsWUJaWL3Qn6otRIden2OZge4kBVutcOEKrsMxd7H+po9ZeWDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T06:05:00.359650Z"},"content_sha256":"ad3109e00120ff01365b394f3a352a2a727ce73e8b11c10c6cfadd123ffcd504","schema_version":"1.0","event_id":"sha256:ad3109e00120ff01365b394f3a352a2a727ce73e8b11c10c6cfadd123ffcd504"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:3KG7BQQY5E5OTE5KRLOBZHUD3V","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Where Do You Think You're Going?: Inferring Beliefs about Dynamics from Behavior","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Anca D. Dragan, Sergey Levine, Siddharth Reddy","submitted_at":"2018-05-21T12:15:34Z","abstract_excerpt":"Inferring intent from observed behavior has been studied extensively within the frameworks of Bayesian inverse planning and inverse reinforcement learning. These methods infer a goal or reward function that best explains the actions of the observed agent, typically a human demonstrator. Another agent can use this inferred intent to predict, imitate, or assist the human user. However, a central assumption in inverse reinforcement learning is that the demonstrator is close to optimal. While models of suboptimal behavior exist, they typically assume that suboptimal actions are the result of some "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.08010","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"P6INv1ORqsrGwhPKNXNc1W1d3Xiyu85nHhKi0wVzbHZOfjq8gejk+mG7AZWSX3AivcXvpl2YF/pp1uoYNZVyBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T06:05:00.360447Z"},"content_sha256":"c3d2da2d802b49f524dfd81dec49ddb85e8ca998b070e5da8ca49492096cb5fa","schema_version":"1.0","event_id":"sha256:c3d2da2d802b49f524dfd81dec49ddb85e8ca998b070e5da8ca49492096cb5fa"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3KG7BQQY5E5OTE5KRLOBZHUD3V/bundle.json","state_url":"https://pith.science/pith/3KG7BQQY5E5OTE5KRLOBZHUD3V/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3KG7BQQY5E5OTE5KRLOBZHUD3V/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-11T06:05:00Z","links":{"resolver":"https://pith.science/pith/3KG7BQQY5E5OTE5KRLOBZHUD3V","bundle":"https://pith.science/pith/3KG7BQQY5E5OTE5KRLOBZHUD3V/bundle.json","state":"https://pith.science/pith/3KG7BQQY5E5OTE5KRLOBZHUD3V/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3KG7BQQY5E5OTE5KRLOBZHUD3V/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:3KG7BQQY5E5OTE5KRLOBZHUD3V","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4202523564616cd6983a94f42e1abd8f87d524d08ce20d2cd9d92c299f7a835d","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-21T12:15:34Z","title_canon_sha256":"478e1b63d277c1a150a7266a4243d4d137e3167aa906b6867f70f195d5959a36"},"schema_version":"1.0","source":{"id":"1805.08010","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.08010","created_at":"2026-05-17T23:56:53Z"},{"alias_kind":"arxiv_version","alias_value":"1805.08010v4","created_at":"2026-05-17T23:56:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.08010","created_at":"2026-05-17T23:56:53Z"},{"alias_kind":"pith_short_12","alias_value":"3KG7BQQY5E5O","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_16","alias_value":"3KG7BQQY5E5OTE5K","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_8","alias_value":"3KG7BQQY","created_at":"2026-05-18T12:32:02Z"}],"graph_snapshots":[{"event_id":"sha256:c3d2da2d802b49f524dfd81dec49ddb85e8ca998b070e5da8ca49492096cb5fa","target":"graph","created_at":"2026-05-17T23:56:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Inferring intent from observed behavior has been studied extensively within the frameworks of Bayesian inverse planning and inverse reinforcement learning. These methods infer a goal or reward function that best explains the actions of the observed agent, typically a human demonstrator. Another agent can use this inferred intent to predict, imitate, or assist the human user. However, a central assumption in inverse reinforcement learning is that the demonstrator is close to optimal. While models of suboptimal behavior exist, they typically assume that suboptimal actions are the result of some ","authors_text":"Anca D. Dragan, Sergey Levine, Siddharth Reddy","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-21T12:15:34Z","title":"Where Do You Think You're Going?: Inferring Beliefs about Dynamics from Behavior"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.08010","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ad3109e00120ff01365b394f3a352a2a727ce73e8b11c10c6cfadd123ffcd504","target":"record","created_at":"2026-05-17T23:56:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4202523564616cd6983a94f42e1abd8f87d524d08ce20d2cd9d92c299f7a835d","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-21T12:15:34Z","title_canon_sha256":"478e1b63d277c1a150a7266a4243d4d137e3167aa906b6867f70f195d5959a36"},"schema_version":"1.0","source":{"id":"1805.08010","kind":"arxiv","version":4}},"canonical_sha256":"da8df0c218e93ae993aa8adc1c9e83dd4f1232ef8d4a23f26adbab3a6d292f01","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"da8df0c218e93ae993aa8adc1c9e83dd4f1232ef8d4a23f26adbab3a6d292f01","first_computed_at":"2026-05-17T23:56:53.369871Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:56:53.369871Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"kHNQl0kaVlrcZQRb+p2//R4SyMSJ47M/aiujhPqSrEz1iBmGvqOxXJ+VJKtZJLszu8uO9n1Dq2HH9+duBkP7Cg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:56:53.370644Z","signed_message":"canonical_sha256_bytes"},"source_id":"1805.08010","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ad3109e00120ff01365b394f3a352a2a727ce73e8b11c10c6cfadd123ffcd504","sha256:c3d2da2d802b49f524dfd81dec49ddb85e8ca998b070e5da8ca49492096cb5fa"],"state_sha256":"b6fd17f81fd032d32beb72681b69a04278f2e98114631ed512695a90175c554a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"lBgpk1lJIXyJ6hWqGz1hfxe4uS1lQtAQAcviXRiNR7tzKsp1LG9qC7AMEph/JglbpSzaNzeQ6EknuslZfOKKDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-11T06:05:00.364628Z","bundle_sha256":"1e211dcafdcbbeb82df93a8c6c9775ccafa0d358721e51488f6d4e41af7da9f8"}}