{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:6Z26G3SYNS6RX4ZBKHFAXF75A4","short_pith_number":"pith:6Z26G3SY","canonical_record":{"source":{"id":"1611.05321","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-11-16T15:33:12Z","cross_cats_sorted":[],"title_canon_sha256":"df7d24f7789c1aabf7bedd85e37aa16066d21a04a8d9928c53784e2b23767d8f","abstract_canon_sha256":"90002e8b80a175bd58f3a3326cdb3de886b05a42a5b559e81df94fbe0abd6889"},"schema_version":"1.0"},"canonical_sha256":"f675e36e586cbd1bf32151ca0b97fd07238ebee03258530a5974572b9033e51e","source":{"kind":"arxiv","id":"1611.05321","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1611.05321","created_at":"2026-05-18T00:41:47Z"},{"alias_kind":"arxiv_version","alias_value":"1611.05321v3","created_at":"2026-05-18T00:41:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1611.05321","created_at":"2026-05-18T00:41:47Z"},{"alias_kind":"pith_short_12","alias_value":"6Z26G3SYNS6R","created_at":"2026-05-18T12:30:04Z"},{"alias_kind":"pith_short_16","alias_value":"6Z26G3SYNS6RX4ZB","created_at":"2026-05-18T12:30:04Z"},{"alias_kind":"pith_short_8","alias_value":"6Z26G3SY","created_at":"2026-05-18T12:30:04Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:6Z26G3SYNS6RX4ZBKHFAXF75A4","target":"record","payload":{"canonical_record":{"source":{"id":"1611.05321","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-11-16T15:33:12Z","cross_cats_sorted":[],"title_canon_sha256":"df7d24f7789c1aabf7bedd85e37aa16066d21a04a8d9928c53784e2b23767d8f","abstract_canon_sha256":"90002e8b80a175bd58f3a3326cdb3de886b05a42a5b559e81df94fbe0abd6889"},"schema_version":"1.0"},"canonical_sha256":"f675e36e586cbd1bf32151ca0b97fd07238ebee03258530a5974572b9033e51e","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:41:47.869904Z","signature_b64":"WWuQhV9rAfJ8ZBMfn1hSZMz4OPOJ3jq+9W2ounM3Kw6gJgbFUYhA/n8eNK5J7xvRlZRHy73doi+asif5K7CWCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f675e36e586cbd1bf32151ca0b97fd07238ebee03258530a5974572b9033e51e","last_reissued_at":"2026-05-18T00:41:47.869249Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:41:47.869249Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1611.05321","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:41:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CZwZtg/82qleb4vgc8p2ojvPxl0+S4KP3JluV8Y/gRXeWuZ5AExsA63lsmsS+EMBIdA7+9CqlK4RDycJQGx3Bg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T06:33:52.863112Z"},"content_sha256":"21adc879003122460e2d161c935a5e850ff3e0a78fdcaa44d6240be42fcbb1ba","schema_version":"1.0","event_id":"sha256:21adc879003122460e2d161c935a5e850ff3e0a78fdcaa44d6240be42fcbb1ba"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:6Z26G3SYNS6RX4ZBKHFAXF75A4","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"A Semi-supervised Framework for Image Captioning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Aurelien Lucchi, Thomas Hofmann, Wenhu Chen","submitted_at":"2016-11-16T15:33:12Z","abstract_excerpt":"State-of-the-art approaches for image captioning require supervised training data consisting of captions with paired image data. These methods are typically unable to use unsupervised data such as textual data with no corresponding images, which is a much more abundant commodity. We here propose a novel way of using such textual data by artificially generating missing visual information. We evaluate this learning approach on a newly designed model that detects visual concepts present in an image and feed them to a reviewer-decoder architecture with an attention mechanism. Unlike previous appro"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1611.05321","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:41:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"UHTC4sEqvSGCO7jhBNYtiIlYy0beU4DJEz8HEFL5RfD8f/qOabRENuiOyECibIWeswAR7r4MsE1ZTSH9ZBndAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T06:33:52.863679Z"},"content_sha256":"cffe18f55df75d49076da533cde36ad6b5e85c0513ba460073638a5f644e5c2b","schema_version":"1.0","event_id":"sha256:cffe18f55df75d49076da533cde36ad6b5e85c0513ba460073638a5f644e5c2b"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6Z26G3SYNS6RX4ZBKHFAXF75A4/bundle.json","state_url":"https://pith.science/pith/6Z26G3SYNS6RX4ZBKHFAXF75A4/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6Z26G3SYNS6RX4ZBKHFAXF75A4/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T06:33:52Z","links":{"resolver":"https://pith.science/pith/6Z26G3SYNS6RX4ZBKHFAXF75A4","bundle":"https://pith.science/pith/6Z26G3SYNS6RX4ZBKHFAXF75A4/bundle.json","state":"https://pith.science/pith/6Z26G3SYNS6RX4ZBKHFAXF75A4/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6Z26G3SYNS6RX4ZBKHFAXF75A4/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:6Z26G3SYNS6RX4ZBKHFAXF75A4","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"90002e8b80a175bd58f3a3326cdb3de886b05a42a5b559e81df94fbe0abd6889","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-11-16T15:33:12Z","title_canon_sha256":"df7d24f7789c1aabf7bedd85e37aa16066d21a04a8d9928c53784e2b23767d8f"},"schema_version":"1.0","source":{"id":"1611.05321","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1611.05321","created_at":"2026-05-18T00:41:47Z"},{"alias_kind":"arxiv_version","alias_value":"1611.05321v3","created_at":"2026-05-18T00:41:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1611.05321","created_at":"2026-05-18T00:41:47Z"},{"alias_kind":"pith_short_12","alias_value":"6Z26G3SYNS6R","created_at":"2026-05-18T12:30:04Z"},{"alias_kind":"pith_short_16","alias_value":"6Z26G3SYNS6RX4ZB","created_at":"2026-05-18T12:30:04Z"},{"alias_kind":"pith_short_8","alias_value":"6Z26G3SY","created_at":"2026-05-18T12:30:04Z"}],"graph_snapshots":[{"event_id":"sha256:cffe18f55df75d49076da533cde36ad6b5e85c0513ba460073638a5f644e5c2b","target":"graph","created_at":"2026-05-18T00:41:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"State-of-the-art approaches for image captioning require supervised training data consisting of captions with paired image data. These methods are typically unable to use unsupervised data such as textual data with no corresponding images, which is a much more abundant commodity. We here propose a novel way of using such textual data by artificially generating missing visual information. We evaluate this learning approach on a newly designed model that detects visual concepts present in an image and feed them to a reviewer-decoder architecture with an attention mechanism. Unlike previous appro","authors_text":"Aurelien Lucchi, Thomas Hofmann, Wenhu Chen","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-11-16T15:33:12Z","title":"A Semi-supervised Framework for Image Captioning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1611.05321","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:21adc879003122460e2d161c935a5e850ff3e0a78fdcaa44d6240be42fcbb1ba","target":"record","created_at":"2026-05-18T00:41:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"90002e8b80a175bd58f3a3326cdb3de886b05a42a5b559e81df94fbe0abd6889","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-11-16T15:33:12Z","title_canon_sha256":"df7d24f7789c1aabf7bedd85e37aa16066d21a04a8d9928c53784e2b23767d8f"},"schema_version":"1.0","source":{"id":"1611.05321","kind":"arxiv","version":3}},"canonical_sha256":"f675e36e586cbd1bf32151ca0b97fd07238ebee03258530a5974572b9033e51e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f675e36e586cbd1bf32151ca0b97fd07238ebee03258530a5974572b9033e51e","first_computed_at":"2026-05-18T00:41:47.869249Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:41:47.869249Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"WWuQhV9rAfJ8ZBMfn1hSZMz4OPOJ3jq+9W2ounM3Kw6gJgbFUYhA/n8eNK5J7xvRlZRHy73doi+asif5K7CWCg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:41:47.869904Z","signed_message":"canonical_sha256_bytes"},"source_id":"1611.05321","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:21adc879003122460e2d161c935a5e850ff3e0a78fdcaa44d6240be42fcbb1ba","sha256:cffe18f55df75d49076da533cde36ad6b5e85c0513ba460073638a5f644e5c2b"],"state_sha256":"85496f628f252a017b9893d4345078676a11f006fe7e6857958f82732c98b8e2"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"dXtA2E8Nup6F0JhFo4PbK2N2zb3Sun6fLiXXnHF1W5MtZpFVa6mBdeNpNib1yJwUEG+2Z6LP7rGkh3CLmiuFAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T06:33:52.866645Z","bundle_sha256":"dc5088dcf455f9e6ebdccd9c3825a21f1666cb6045d34a5649960c5e56753fcb"}}