{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:WR74KRM3LLNY65HWUJ6GK76KJ5","short_pith_number":"pith:WR74KRM3","canonical_record":{"source":{"id":"1705.10561","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2017-05-30T11:44:50Z","cross_cats_sorted":[],"title_canon_sha256":"81135855d2f91ff45a61cb513623467bc0fed6022cae215d13cdee1e928a913a","abstract_canon_sha256":"62e858131f8a5dab1e9257905c65103e0d900f84dc877382b62a27265065512f"},"schema_version":"1.0"},"canonical_sha256":"b47fc5459b5adb8f74f6a27c657fca4f7b69fa54dd973265b0a78afa084beff3","source":{"kind":"arxiv","id":"1705.10561","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.10561","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"arxiv_version","alias_value":"1705.10561v3","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.10561","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"pith_short_12","alias_value":"WR74KRM3LLNY","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_16","alias_value":"WR74KRM3LLNY65HW","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_8","alias_value":"WR74KRM3","created_at":"2026-05-18T12:31:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:WR74KRM3LLNY65HWUJ6GK76KJ5","target":"record","payload":{"canonical_record":{"source":{"id":"1705.10561","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2017-05-30T11:44:50Z","cross_cats_sorted":[],"title_canon_sha256":"81135855d2f91ff45a61cb513623467bc0fed6022cae215d13cdee1e928a913a","abstract_canon_sha256":"62e858131f8a5dab1e9257905c65103e0d900f84dc877382b62a27265065512f"},"schema_version":"1.0"},"canonical_sha256":"b47fc5459b5adb8f74f6a27c657fca4f7b69fa54dd973265b0a78afa084beff3","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:14:28.961375Z","signature_b64":"C0k68T2ntT/z8++p9mOePTNwvs4VAvDFAECBiKVdvjKz9yRgZ6VpChLE2Li78e7x6i4EZrYXR2DTvfEEevMbCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b47fc5459b5adb8f74f6a27c657fca4f7b69fa54dd973265b0a78afa084beff3","last_reissued_at":"2026-05-18T00:14:28.960694Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:14:28.960694Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1705.10561","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:14:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"t8dxzbV0AT7eNKbdeHq0NF0kbFnx8/HrMQ/oSKMSTWhLW3wEX9NzEosavj0fpePvJEmcMoUcae8RH14b46VoAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T14:48:45.546903Z"},"content_sha256":"2beffbb96fde870c6e4803efba25e65bd583814d016fbb8c86304a0419201ecb","schema_version":"1.0","event_id":"sha256:2beffbb96fde870c6e4803efba25e65bd583814d016fbb8c86304a0419201ecb"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:WR74KRM3LLNY65HWUJ6GK76KJ5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"End-to-end Active Object Tracking via Reinforcement Learning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Fangwei Zhong, Peng Sun, Tong Zhang, Wei Liu, Wenhan Luo, Yizhou Wang","submitted_at":"2017-05-30T11:44:50Z","abstract_excerpt":"We study active object tracking, where a tracker takes as input the visual observation (i.e., frame sequence) and produces the camera control signal (e.g., move forward, turn left, etc.). Conventional methods tackle the tracking and the camera control separately, which is challenging to tune jointly. It also incurs many human efforts for labeling and many expensive trial-and-errors in realworld. To address these issues, we propose, in this paper, an end-to-end solution via deep reinforcement learning, where a ConvNet-LSTM function approximator is adopted for the direct frame-toaction predictio"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.10561","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:14:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"j/8gSXzPKdLoTplULum1was47N01AJDJk5/57S5qKnJ31nL7sd8ApyumODeETPOy3e51/2Srlh2CtXryVSiJAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T14:48:45.547240Z"},"content_sha256":"3597939601e279dbcf97e2abf44e043ecb515a1f96106a671ba03d0520e21e09","schema_version":"1.0","event_id":"sha256:3597939601e279dbcf97e2abf44e043ecb515a1f96106a671ba03d0520e21e09"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/WR74KRM3LLNY65HWUJ6GK76KJ5/bundle.json","state_url":"https://pith.science/pith/WR74KRM3LLNY65HWUJ6GK76KJ5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/WR74KRM3LLNY65HWUJ6GK76KJ5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T14:48:45Z","links":{"resolver":"https://pith.science/pith/WR74KRM3LLNY65HWUJ6GK76KJ5","bundle":"https://pith.science/pith/WR74KRM3LLNY65HWUJ6GK76KJ5/bundle.json","state":"https://pith.science/pith/WR74KRM3LLNY65HWUJ6GK76KJ5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/WR74KRM3LLNY65HWUJ6GK76KJ5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:WR74KRM3LLNY65HWUJ6GK76KJ5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"62e858131f8a5dab1e9257905c65103e0d900f84dc877382b62a27265065512f","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2017-05-30T11:44:50Z","title_canon_sha256":"81135855d2f91ff45a61cb513623467bc0fed6022cae215d13cdee1e928a913a"},"schema_version":"1.0","source":{"id":"1705.10561","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1705.10561","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"arxiv_version","alias_value":"1705.10561v3","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1705.10561","created_at":"2026-05-18T00:14:28Z"},{"alias_kind":"pith_short_12","alias_value":"WR74KRM3LLNY","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_16","alias_value":"WR74KRM3LLNY65HW","created_at":"2026-05-18T12:31:53Z"},{"alias_kind":"pith_short_8","alias_value":"WR74KRM3","created_at":"2026-05-18T12:31:53Z"}],"graph_snapshots":[{"event_id":"sha256:3597939601e279dbcf97e2abf44e043ecb515a1f96106a671ba03d0520e21e09","target":"graph","created_at":"2026-05-18T00:14:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We study active object tracking, where a tracker takes as input the visual observation (i.e., frame sequence) and produces the camera control signal (e.g., move forward, turn left, etc.). Conventional methods tackle the tracking and the camera control separately, which is challenging to tune jointly. It also incurs many human efforts for labeling and many expensive trial-and-errors in realworld. To address these issues, we propose, in this paper, an end-to-end solution via deep reinforcement learning, where a ConvNet-LSTM function approximator is adopted for the direct frame-toaction predictio","authors_text":"Fangwei Zhong, Peng Sun, Tong Zhang, Wei Liu, Wenhan Luo, Yizhou Wang","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2017-05-30T11:44:50Z","title":"End-to-end Active Object Tracking via Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1705.10561","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2beffbb96fde870c6e4803efba25e65bd583814d016fbb8c86304a0419201ecb","target":"record","created_at":"2026-05-18T00:14:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"62e858131f8a5dab1e9257905c65103e0d900f84dc877382b62a27265065512f","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2017-05-30T11:44:50Z","title_canon_sha256":"81135855d2f91ff45a61cb513623467bc0fed6022cae215d13cdee1e928a913a"},"schema_version":"1.0","source":{"id":"1705.10561","kind":"arxiv","version":3}},"canonical_sha256":"b47fc5459b5adb8f74f6a27c657fca4f7b69fa54dd973265b0a78afa084beff3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b47fc5459b5adb8f74f6a27c657fca4f7b69fa54dd973265b0a78afa084beff3","first_computed_at":"2026-05-18T00:14:28.960694Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:14:28.960694Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"C0k68T2ntT/z8++p9mOePTNwvs4VAvDFAECBiKVdvjKz9yRgZ6VpChLE2Li78e7x6i4EZrYXR2DTvfEEevMbCQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:14:28.961375Z","signed_message":"canonical_sha256_bytes"},"source_id":"1705.10561","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2beffbb96fde870c6e4803efba25e65bd583814d016fbb8c86304a0419201ecb","sha256:3597939601e279dbcf97e2abf44e043ecb515a1f96106a671ba03d0520e21e09"],"state_sha256":"12c1a0bef5bd21ca4b072b203af3762d4fb0936d41261a0934f159a55fcbe985"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OHCLl7mpyWpT4E6EDTVcRaSYd5Hh+s3OSwedezc2VhEflHpivlb2nPfg/y8uubvQK4KM8pjB+DxL3MuHzEJqAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T14:48:45.549116Z","bundle_sha256":"c48c1046cd121de08fa8a94fe1d6a81f13e79846da79775282753cb19e731022"}}