{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:VL6XSQFLDP6KRO5BOTLSWMQ5KA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ca02d193660e126540f2aa3a3930e7d5d6350913f847b35f8dbfac440530ee25","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-09-16T13:37:45Z","title_canon_sha256":"39667f4c234b2018bd8a8164e0ddefe8f6866e83feb78ae2ed02334c34a49742"},"schema_version":"1.0","source":{"id":"1809.05872","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1809.05872","created_at":"2026-05-18T00:05:36Z"},{"alias_kind":"arxiv_version","alias_value":"1809.05872v1","created_at":"2026-05-18T00:05:36Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.05872","created_at":"2026-05-18T00:05:36Z"},{"alias_kind":"pith_short_12","alias_value":"VL6XSQFLDP6K","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_16","alias_value":"VL6XSQFLDP6KRO5B","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_8","alias_value":"VL6XSQFL","created_at":"2026-05-18T12:32:59Z"}],"graph_snapshots":[{"event_id":"sha256:91cfd33f4aec0aee837b44c7f132a7bfb4c9c8b8425bce40af660da2d0db6683","target":"graph","created_at":"2026-05-18T00:05:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Current imitation learning techniques are too restrictive because they require the agent and expert to share the same action space. However, oftentimes agents that act differently from the expert can solve the task just as good. For example, a person lifting a box can be imitated by a ceiling mounted robot or a desktop-based robotic-arm. In both cases, the end goal of lifting the box is achieved, perhaps using different strategies. We denote this setup as \\textit{Inspiration Learning} - knowledge transfer between agents that operate in different action spaces. Since state-action expert demonst","authors_text":"Nir Baram, Shie Mannor","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-09-16T13:37:45Z","title":"Inspiration Learning through Preferences"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.05872","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3b34c1e1b4f063892578e4db47a7c6c4dc48924d81e659d30001fbbbd369c46c","target":"record","created_at":"2026-05-18T00:05:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ca02d193660e126540f2aa3a3930e7d5d6350913f847b35f8dbfac440530ee25","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-09-16T13:37:45Z","title_canon_sha256":"39667f4c234b2018bd8a8164e0ddefe8f6866e83feb78ae2ed02334c34a49742"},"schema_version":"1.0","source":{"id":"1809.05872","kind":"arxiv","version":1}},"canonical_sha256":"aafd7940ab1bfca8bba174d72b321d5025eb7312a4d5ff5932ee69580e17e062","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"aafd7940ab1bfca8bba174d72b321d5025eb7312a4d5ff5932ee69580e17e062","first_computed_at":"2026-05-18T00:05:36.252340Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:05:36.252340Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"j9flp+iyKp4/tkDghgX9JomS4xe1IhDhp0FuDCECJqEaCLRyLVDJtuf4KYZ8CbtzjyACflMBLoua0/sGWTrBCA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:05:36.252806Z","signed_message":"canonical_sha256_bytes"},"source_id":"1809.05872","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3b34c1e1b4f063892578e4db47a7c6c4dc48924d81e659d30001fbbbd369c46c","sha256:91cfd33f4aec0aee837b44c7f132a7bfb4c9c8b8425bce40af660da2d0db6683"],"state_sha256":"9bd0b073a7904ed5c9611f0f5cd8d860a8a425cded492b8907aac68106068c2e"}