{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:WCDBLO2D7HHBA53EKBCFKUAQIE","short_pith_number":"pith:WCDBLO2D","canonical_record":{"source":{"id":"1811.05253","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-13T12:31:26Z","cross_cats_sorted":[],"title_canon_sha256":"f8f9e6c8f2043ca63a7dbe1e8789de02d7137e49e08cc8c896223926c99eb1f1","abstract_canon_sha256":"4ea0a1b0845c7831b2c44c864d2d6ebb5ee54b0a37c8fcf1e92e9966f20a25fc"},"schema_version":"1.0"},"canonical_sha256":"b08615bb43f9ce1077645044555010412e091da10bc7819690476d63308c880e","source":{"kind":"arxiv","id":"1811.05253","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.05253","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"arxiv_version","alias_value":"1811.05253v2","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.05253","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"pith_short_12","alias_value":"WCDBLO2D7HHB","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_16","alias_value":"WCDBLO2D7HHBA53E","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_8","alias_value":"WCDBLO2D","created_at":"2026-05-18T12:32:59Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:WCDBLO2D7HHBA53EKBCFKUAQIE","target":"record","payload":{"canonical_record":{"source":{"id":"1811.05253","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-13T12:31:26Z","cross_cats_sorted":[],"title_canon_sha256":"f8f9e6c8f2043ca63a7dbe1e8789de02d7137e49e08cc8c896223926c99eb1f1","abstract_canon_sha256":"4ea0a1b0845c7831b2c44c864d2d6ebb5ee54b0a37c8fcf1e92e9966f20a25fc"},"schema_version":"1.0"},"canonical_sha256":"b08615bb43f9ce1077645044555010412e091da10bc7819690476d63308c880e","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:56:33.344296Z","signature_b64":"1ar/+g0w8oQLT7WnNIYgsPvpvPJZgEjUp8mqochrk9Mpxg+PVp4k0FQ0AzIrcGln4ly4Mg+eawaa2/hRhx6aCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b08615bb43f9ce1077645044555010412e091da10bc7819690476d63308c880e","last_reissued_at":"2026-05-17T23:56:33.343613Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:56:33.343613Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1811.05253","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:33Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"KxNuMMqDEgyL46GUKYMrc7P2Y4x7qBVFVL6J2RRKnGinMZf5zPUZxdGz6FnH0o51eyjigenPS9IKwsJbT0QkAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T19:45:28.102296Z"},"content_sha256":"0e238dfefded083597703fe9f103738a94ad5d5b8f5f38486bbf2b60467346a3","schema_version":"1.0","event_id":"sha256:0e238dfefded083597703fe9f103738a94ad5d5b8f5f38486bbf2b60467346a3"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:WCDBLO2D7HHBA53EKBCFKUAQIE","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Image Captioning Based on a Hierarchical Attention Mechanism and Policy Gradient Optimization","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Bailing Zhang, Fangyu Wu, Jeremy S. Smith, Shiyang Yan, Wenjin Lu, Yuan Xie","submitted_at":"2018-11-13T12:31:26Z","abstract_excerpt":"Automatically generating the descriptions of an image, i.e., image captioning, is an important and fundamental topic in artificial intelligence, which bridges the gap between computer vision and natural language processing. Based on the successful deep learning models, especially the CNN model and Long Short-Term Memories (LSTMs) with attention mechanism, we propose a hierarchical attention model by utilizing both of the global CNN features and the local object features for more effective feature representation and reasoning in image captioning. The generative adversarial network (GAN), togeth"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.05253","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:33Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FcHk3pYD2fBTa3VgnsymHLytluwtmSb47ofoWaGhvLq2cmcwwGpqqlWolcZFCI0gU97HEFuBsXdJCNOs4kQSAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T19:45:28.102682Z"},"content_sha256":"997154135bcdc662852cfe2cacdf77837c43a37a0019250d46ef22c6e7ab2274","schema_version":"1.0","event_id":"sha256:997154135bcdc662852cfe2cacdf77837c43a37a0019250d46ef22c6e7ab2274"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/WCDBLO2D7HHBA53EKBCFKUAQIE/bundle.json","state_url":"https://pith.science/pith/WCDBLO2D7HHBA53EKBCFKUAQIE/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/WCDBLO2D7HHBA53EKBCFKUAQIE/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T19:45:28Z","links":{"resolver":"https://pith.science/pith/WCDBLO2D7HHBA53EKBCFKUAQIE","bundle":"https://pith.science/pith/WCDBLO2D7HHBA53EKBCFKUAQIE/bundle.json","state":"https://pith.science/pith/WCDBLO2D7HHBA53EKBCFKUAQIE/state.json","well_known_bundle":"https://pith.science/.well-known/pith/WCDBLO2D7HHBA53EKBCFKUAQIE/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:WCDBLO2D7HHBA53EKBCFKUAQIE","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4ea0a1b0845c7831b2c44c864d2d6ebb5ee54b0a37c8fcf1e92e9966f20a25fc","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-13T12:31:26Z","title_canon_sha256":"f8f9e6c8f2043ca63a7dbe1e8789de02d7137e49e08cc8c896223926c99eb1f1"},"schema_version":"1.0","source":{"id":"1811.05253","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.05253","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"arxiv_version","alias_value":"1811.05253v2","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.05253","created_at":"2026-05-17T23:56:33Z"},{"alias_kind":"pith_short_12","alias_value":"WCDBLO2D7HHB","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_16","alias_value":"WCDBLO2D7HHBA53E","created_at":"2026-05-18T12:32:59Z"},{"alias_kind":"pith_short_8","alias_value":"WCDBLO2D","created_at":"2026-05-18T12:32:59Z"}],"graph_snapshots":[{"event_id":"sha256:997154135bcdc662852cfe2cacdf77837c43a37a0019250d46ef22c6e7ab2274","target":"graph","created_at":"2026-05-17T23:56:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Automatically generating the descriptions of an image, i.e., image captioning, is an important and fundamental topic in artificial intelligence, which bridges the gap between computer vision and natural language processing. Based on the successful deep learning models, especially the CNN model and Long Short-Term Memories (LSTMs) with attention mechanism, we propose a hierarchical attention model by utilizing both of the global CNN features and the local object features for more effective feature representation and reasoning in image captioning. The generative adversarial network (GAN), togeth","authors_text":"Bailing Zhang, Fangyu Wu, Jeremy S. Smith, Shiyang Yan, Wenjin Lu, Yuan Xie","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-13T12:31:26Z","title":"Image Captioning Based on a Hierarchical Attention Mechanism and Policy Gradient Optimization"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.05253","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0e238dfefded083597703fe9f103738a94ad5d5b8f5f38486bbf2b60467346a3","target":"record","created_at":"2026-05-17T23:56:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4ea0a1b0845c7831b2c44c864d2d6ebb5ee54b0a37c8fcf1e92e9966f20a25fc","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-11-13T12:31:26Z","title_canon_sha256":"f8f9e6c8f2043ca63a7dbe1e8789de02d7137e49e08cc8c896223926c99eb1f1"},"schema_version":"1.0","source":{"id":"1811.05253","kind":"arxiv","version":2}},"canonical_sha256":"b08615bb43f9ce1077645044555010412e091da10bc7819690476d63308c880e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b08615bb43f9ce1077645044555010412e091da10bc7819690476d63308c880e","first_computed_at":"2026-05-17T23:56:33.343613Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:56:33.343613Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"1ar/+g0w8oQLT7WnNIYgsPvpvPJZgEjUp8mqochrk9Mpxg+PVp4k0FQ0AzIrcGln4ly4Mg+eawaa2/hRhx6aCA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:56:33.344296Z","signed_message":"canonical_sha256_bytes"},"source_id":"1811.05253","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0e238dfefded083597703fe9f103738a94ad5d5b8f5f38486bbf2b60467346a3","sha256:997154135bcdc662852cfe2cacdf77837c43a37a0019250d46ef22c6e7ab2274"],"state_sha256":"4bcfa760e4df3243192403ba00c8f7fdb3539b403c6f2421cb602824bde4781e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"xt5AebzI6p7xEWhfV5z+BtI2NvVDIoT/5UaDSkSZZwp4oWVU7lkFh3+jU74kM7ya5/ngj6RPizpjqZeUBbjcDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T19:45:28.104698Z","bundle_sha256":"591763ba26461b8d15e009431c942b18043fed4098bd753de54b29ca441e4a82"}}