{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:SDLMQVVZVW7TTYXQ3UQT7RV6JQ","short_pith_number":"pith:SDLMQVVZ","canonical_record":{"source":{"id":"1612.01033","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-03T23:01:36Z","cross_cats_sorted":[],"title_canon_sha256":"ab16bcaf0e8bafc82093f2a0ebfda7dbd60ae3d7baf9b5d2dbec36b50bed9abc","abstract_canon_sha256":"5071a7cc5e07f2b7e27fd756e24d5f8639d96ad5d564886b6c19a8de03324765"},"schema_version":"1.0"},"canonical_sha256":"90d6c856b9adbf39e2f0dd213fc6be4c0eaf060e0f92d8d965d9278567cf6577","source":{"kind":"arxiv","id":"1612.01033","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1612.01033","created_at":"2026-05-18T00:36:43Z"},{"alias_kind":"arxiv_version","alias_value":"1612.01033v2","created_at":"2026-05-18T00:36:43Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1612.01033","created_at":"2026-05-18T00:36:43Z"},{"alias_kind":"pith_short_12","alias_value":"SDLMQVVZVW7T","created_at":"2026-05-18T12:30:44Z"},{"alias_kind":"pith_short_16","alias_value":"SDLMQVVZVW7TTYXQ","created_at":"2026-05-18T12:30:44Z"},{"alias_kind":"pith_short_8","alias_value":"SDLMQVVZ","created_at":"2026-05-18T12:30:44Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:SDLMQVVZVW7TTYXQ3UQT7RV6JQ","target":"record","payload":{"canonical_record":{"source":{"id":"1612.01033","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-03T23:01:36Z","cross_cats_sorted":[],"title_canon_sha256":"ab16bcaf0e8bafc82093f2a0ebfda7dbd60ae3d7baf9b5d2dbec36b50bed9abc","abstract_canon_sha256":"5071a7cc5e07f2b7e27fd756e24d5f8639d96ad5d564886b6c19a8de03324765"},"schema_version":"1.0"},"canonical_sha256":"90d6c856b9adbf39e2f0dd213fc6be4c0eaf060e0f92d8d965d9278567cf6577","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:36:43.658938Z","signature_b64":"41FjedlB60Aj03RlwAT9LePaY0xH0udrjI5/a+OYZOCkIyj08ik8lIgKlPpF9EvJVdWYE26DPlJPh+2KsXVLCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"90d6c856b9adbf39e2f0dd213fc6be4c0eaf060e0f92d8d965d9278567cf6577","last_reissued_at":"2026-05-18T00:36:43.658277Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:36:43.658277Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1612.01033","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:36:43Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/gkHn2gWnvB5dl9hSf8WrSSu7C7UzjIfCsB2f9E2b5HPUNMIwgmqez2mHz0V+J97VJ5Uos/U59WzAjpP6B2XDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T10:44:46.730206Z"},"content_sha256":"e03aef021172f578a1128199e6e3e04ae2b7158f0ee2f7d60e5ccbdb837aff6b","schema_version":"1.0","event_id":"sha256:e03aef021172f578a1128199e6e3e04ae2b7158f0ee2f7d60e5ccbdb837aff6b"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:SDLMQVVZVW7TTYXQ3UQT7RV6JQ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Areas of Attention for Image Captioning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Cordelia Schmid, Jakob Verbeek, Marco Pedersoli, Thomas Lucas","submitted_at":"2016-12-03T23:01:36Z","abstract_excerpt":"We propose \"Areas of Attention\", a novel attention-based model for automatic image captioning. Our approach models the dependencies between image regions, caption words, and the state of an RNN language model, using three pairwise interactions. In contrast to previous attention-based approaches that associate image regions only to the RNN state, our method allows a direct association between caption words and image regions. During training these associations are inferred from image-level captions, akin to weakly-supervised object detector training. These associations help to improve captioning"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1612.01033","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:36:43Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FGYLOLLxgT/R3sfN7UZeqTh3Gh1H9pQUI62a+X34oL65I4W4wQNOMCVjnUh5uHCEk9ZYL02Jrrla4tMkgBwQDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T10:44:46.730827Z"},"content_sha256":"df00ca39d8142f296dc5c298c84f3a74120a4d00e5d9ac19b8768db830c9fb79","schema_version":"1.0","event_id":"sha256:df00ca39d8142f296dc5c298c84f3a74120a4d00e5d9ac19b8768db830c9fb79"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SDLMQVVZVW7TTYXQ3UQT7RV6JQ/bundle.json","state_url":"https://pith.science/pith/SDLMQVVZVW7TTYXQ3UQT7RV6JQ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SDLMQVVZVW7TTYXQ3UQT7RV6JQ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-10T10:44:46Z","links":{"resolver":"https://pith.science/pith/SDLMQVVZVW7TTYXQ3UQT7RV6JQ","bundle":"https://pith.science/pith/SDLMQVVZVW7TTYXQ3UQT7RV6JQ/bundle.json","state":"https://pith.science/pith/SDLMQVVZVW7TTYXQ3UQT7RV6JQ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SDLMQVVZVW7TTYXQ3UQT7RV6JQ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:SDLMQVVZVW7TTYXQ3UQT7RV6JQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5071a7cc5e07f2b7e27fd756e24d5f8639d96ad5d564886b6c19a8de03324765","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-03T23:01:36Z","title_canon_sha256":"ab16bcaf0e8bafc82093f2a0ebfda7dbd60ae3d7baf9b5d2dbec36b50bed9abc"},"schema_version":"1.0","source":{"id":"1612.01033","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1612.01033","created_at":"2026-05-18T00:36:43Z"},{"alias_kind":"arxiv_version","alias_value":"1612.01033v2","created_at":"2026-05-18T00:36:43Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1612.01033","created_at":"2026-05-18T00:36:43Z"},{"alias_kind":"pith_short_12","alias_value":"SDLMQVVZVW7T","created_at":"2026-05-18T12:30:44Z"},{"alias_kind":"pith_short_16","alias_value":"SDLMQVVZVW7TTYXQ","created_at":"2026-05-18T12:30:44Z"},{"alias_kind":"pith_short_8","alias_value":"SDLMQVVZ","created_at":"2026-05-18T12:30:44Z"}],"graph_snapshots":[{"event_id":"sha256:df00ca39d8142f296dc5c298c84f3a74120a4d00e5d9ac19b8768db830c9fb79","target":"graph","created_at":"2026-05-18T00:36:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We propose \"Areas of Attention\", a novel attention-based model for automatic image captioning. Our approach models the dependencies between image regions, caption words, and the state of an RNN language model, using three pairwise interactions. In contrast to previous attention-based approaches that associate image regions only to the RNN state, our method allows a direct association between caption words and image regions. During training these associations are inferred from image-level captions, akin to weakly-supervised object detector training. These associations help to improve captioning","authors_text":"Cordelia Schmid, Jakob Verbeek, Marco Pedersoli, Thomas Lucas","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-03T23:01:36Z","title":"Areas of Attention for Image Captioning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1612.01033","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e03aef021172f578a1128199e6e3e04ae2b7158f0ee2f7d60e5ccbdb837aff6b","target":"record","created_at":"2026-05-18T00:36:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5071a7cc5e07f2b7e27fd756e24d5f8639d96ad5d564886b6c19a8de03324765","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-12-03T23:01:36Z","title_canon_sha256":"ab16bcaf0e8bafc82093f2a0ebfda7dbd60ae3d7baf9b5d2dbec36b50bed9abc"},"schema_version":"1.0","source":{"id":"1612.01033","kind":"arxiv","version":2}},"canonical_sha256":"90d6c856b9adbf39e2f0dd213fc6be4c0eaf060e0f92d8d965d9278567cf6577","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"90d6c856b9adbf39e2f0dd213fc6be4c0eaf060e0f92d8d965d9278567cf6577","first_computed_at":"2026-05-18T00:36:43.658277Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:36:43.658277Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"41FjedlB60Aj03RlwAT9LePaY0xH0udrjI5/a+OYZOCkIyj08ik8lIgKlPpF9EvJVdWYE26DPlJPh+2KsXVLCw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:36:43.658938Z","signed_message":"canonical_sha256_bytes"},"source_id":"1612.01033","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e03aef021172f578a1128199e6e3e04ae2b7158f0ee2f7d60e5ccbdb837aff6b","sha256:df00ca39d8142f296dc5c298c84f3a74120a4d00e5d9ac19b8768db830c9fb79"],"state_sha256":"faecfd1c544df42fe8d5cab74ea5e0bdc56fa8a26e2c6c45e5333b8997397f8e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"WXdqs37EHpgOMDwZWlK47a7DesZGqYBv01slDPEE6Ra9pQ6/smT0AJ6Uf/BV9AOy4qq5aYWFUYaELRPR3zR/Dg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-10T10:44:46.734700Z","bundle_sha256":"b236607fc66d1584d6103520c0a5fc633ea82934c6ff9b6c3730f6a1d6aac632"}}