{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:EMNBOTA4B4IGDAHWVFXV2D4VUH","short_pith_number":"pith:EMNBOTA4","canonical_record":{"source":{"id":"1612.04949","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-15T07:19:46Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"28056c75ecdd9cac199d1b2313e823a6547ba0d7ab70fe8dde6eb4c8f0d667e4","abstract_canon_sha256":"3a4a2ef696ddfcf159f044ad34e7f3654bebd3967ada922e70ab9ad66a601cb4"},"schema_version":"1.0"},"canonical_sha256":"231a174c1c0f106180f6a96f5d0f95a1ebf3fb37885a03106f1ac9bd20f1be4e","source":{"kind":"arxiv","id":"1612.04949","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1612.04949","created_at":"2026-05-18T00:54:53Z"},{"alias_kind":"arxiv_version","alias_value":"1612.04949v1","created_at":"2026-05-18T00:54:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1612.04949","created_at":"2026-05-18T00:54:53Z"},{"alias_kind":"pith_short_12","alias_value":"EMNBOTA4B4IG","created_at":"2026-05-18T12:30:12Z"},{"alias_kind":"pith_short_16","alias_value":"EMNBOTA4B4IGDAHW","created_at":"2026-05-18T12:30:12Z"},{"alias_kind":"pith_short_8","alias_value":"EMNBOTA4","created_at":"2026-05-18T12:30:12Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:EMNBOTA4B4IGDAHWVFXV2D4VUH","target":"record","payload":{"canonical_record":{"source":{"id":"1612.04949","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-15T07:19:46Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"28056c75ecdd9cac199d1b2313e823a6547ba0d7ab70fe8dde6eb4c8f0d667e4","abstract_canon_sha256":"3a4a2ef696ddfcf159f044ad34e7f3654bebd3967ada922e70ab9ad66a601cb4"},"schema_version":"1.0"},"canonical_sha256":"231a174c1c0f106180f6a96f5d0f95a1ebf3fb37885a03106f1ac9bd20f1be4e","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:54:53.829039Z","signature_b64":"+xE5J2WvaO7P+OnhIoijlo9wPxXrBWDf/FZWKsZvIr6JWY+E6vCYsqneBAYflbcXKclO54rcc07eHdLWkpfBBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"231a174c1c0f106180f6a96f5d0f95a1ebf3fb37885a03106f1ac9bd20f1be4e","last_reissued_at":"2026-05-18T00:54:53.828198Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:54:53.828198Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1612.04949","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:54:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"G+lKnjOaxYhgCAM5XUuNpSBjE4nx2uYgKf7YGfGrDdMDt9wQgqjEa+zciXVtCwGp+/IdKwllXazGSmasdOGoCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T08:43:56.411584Z"},"content_sha256":"2228441916f4e74c18dc0824621012679a17482298f1266a0a4275bf47fa5ea2","schema_version":"1.0","event_id":"sha256:2228441916f4e74c18dc0824621012679a17482298f1266a0a4275bf47fa5ea2"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:EMNBOTA4B4IGDAHWVFXV2D4VUH","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Recurrent Image Captioner: Describing Images with Spatial-Invariant Transformation and Attention Filtering","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL"],"primary_cat":"cs.CV","authors_text":"Fumin Shen, Hao Liu, Heng Tao Shen, Lixin Duan, Yang Yang","submitted_at":"2016-12-15T07:19:46Z","abstract_excerpt":"Along with the prosperity of recurrent neural network in modelling sequential data and the power of attention mechanism in automatically identify salient information, image captioning, a.k.a., image description, has been remarkably advanced in recent years. Nonetheless, most existing paradigms may suffer from the deficiency of invariance to images with different scaling, rotation, etc.; and effective integration of standalone attention to form a holistic end-to-end system. In this paper, we propose a novel image captioning architecture, termed Recurrent Image Captioner (\\textbf{RIC}), which al"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1612.04949","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:54:53Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RT4DSL9XyoYy3WIkW2ooscKPeDKgDzIu0kVJeFz0k4Ypj0/N66X1ugtNphVWib4mX7Hm/Tj5Ft/gcbzVkpydDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T08:43:56.412300Z"},"content_sha256":"eb7e2b88f6e2c0e926a1089cf16c3f4f70776d16c1dd1ea072c2be9c0dda7a5c","schema_version":"1.0","event_id":"sha256:eb7e2b88f6e2c0e926a1089cf16c3f4f70776d16c1dd1ea072c2be9c0dda7a5c"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/EMNBOTA4B4IGDAHWVFXV2D4VUH/bundle.json","state_url":"https://pith.science/pith/EMNBOTA4B4IGDAHWVFXV2D4VUH/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/EMNBOTA4B4IGDAHWVFXV2D4VUH/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T08:43:56Z","links":{"resolver":"https://pith.science/pith/EMNBOTA4B4IGDAHWVFXV2D4VUH","bundle":"https://pith.science/pith/EMNBOTA4B4IGDAHWVFXV2D4VUH/bundle.json","state":"https://pith.science/pith/EMNBOTA4B4IGDAHWVFXV2D4VUH/state.json","well_known_bundle":"https://pith.science/.well-known/pith/EMNBOTA4B4IGDAHWVFXV2D4VUH/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:EMNBOTA4B4IGDAHWVFXV2D4VUH","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3a4a2ef696ddfcf159f044ad34e7f3654bebd3967ada922e70ab9ad66a601cb4","cross_cats_sorted":["cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-15T07:19:46Z","title_canon_sha256":"28056c75ecdd9cac199d1b2313e823a6547ba0d7ab70fe8dde6eb4c8f0d667e4"},"schema_version":"1.0","source":{"id":"1612.04949","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1612.04949","created_at":"2026-05-18T00:54:53Z"},{"alias_kind":"arxiv_version","alias_value":"1612.04949v1","created_at":"2026-05-18T00:54:53Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1612.04949","created_at":"2026-05-18T00:54:53Z"},{"alias_kind":"pith_short_12","alias_value":"EMNBOTA4B4IG","created_at":"2026-05-18T12:30:12Z"},{"alias_kind":"pith_short_16","alias_value":"EMNBOTA4B4IGDAHW","created_at":"2026-05-18T12:30:12Z"},{"alias_kind":"pith_short_8","alias_value":"EMNBOTA4","created_at":"2026-05-18T12:30:12Z"}],"graph_snapshots":[{"event_id":"sha256:eb7e2b88f6e2c0e926a1089cf16c3f4f70776d16c1dd1ea072c2be9c0dda7a5c","target":"graph","created_at":"2026-05-18T00:54:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Along with the prosperity of recurrent neural network in modelling sequential data and the power of attention mechanism in automatically identify salient information, image captioning, a.k.a., image description, has been remarkably advanced in recent years. Nonetheless, most existing paradigms may suffer from the deficiency of invariance to images with different scaling, rotation, etc.; and effective integration of standalone attention to form a holistic end-to-end system. In this paper, we propose a novel image captioning architecture, termed Recurrent Image Captioner (\\textbf{RIC}), which al","authors_text":"Fumin Shen, Hao Liu, Heng Tao Shen, Lixin Duan, Yang Yang","cross_cats":["cs.CL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-15T07:19:46Z","title":"Recurrent Image Captioner: Describing Images with Spatial-Invariant Transformation and Attention Filtering"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1612.04949","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:2228441916f4e74c18dc0824621012679a17482298f1266a0a4275bf47fa5ea2","target":"record","created_at":"2026-05-18T00:54:53Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3a4a2ef696ddfcf159f044ad34e7f3654bebd3967ada922e70ab9ad66a601cb4","cross_cats_sorted":["cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-15T07:19:46Z","title_canon_sha256":"28056c75ecdd9cac199d1b2313e823a6547ba0d7ab70fe8dde6eb4c8f0d667e4"},"schema_version":"1.0","source":{"id":"1612.04949","kind":"arxiv","version":1}},"canonical_sha256":"231a174c1c0f106180f6a96f5d0f95a1ebf3fb37885a03106f1ac9bd20f1be4e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"231a174c1c0f106180f6a96f5d0f95a1ebf3fb37885a03106f1ac9bd20f1be4e","first_computed_at":"2026-05-18T00:54:53.828198Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:54:53.828198Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"+xE5J2WvaO7P+OnhIoijlo9wPxXrBWDf/FZWKsZvIr6JWY+E6vCYsqneBAYflbcXKclO54rcc07eHdLWkpfBBw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:54:53.829039Z","signed_message":"canonical_sha256_bytes"},"source_id":"1612.04949","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:2228441916f4e74c18dc0824621012679a17482298f1266a0a4275bf47fa5ea2","sha256:eb7e2b88f6e2c0e926a1089cf16c3f4f70776d16c1dd1ea072c2be9c0dda7a5c"],"state_sha256":"450d60a3d434a383951235622e298b9883af6f10dd6bb28622204049ea91d3b2"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"WIJx2Q+zJqAfUFOBy0E/yBh6Uj+Bvzsz8Edx2fmuPXgVUKWJRo8SHUdNVMBvlf8o7ymxUy6efVb3J76MORU/Ag==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T08:43:56.415632Z","bundle_sha256":"8b019453c14dcbaaad606558bf736177b3fd805f9b12c97d9b46647e9dafb8a0"}}