{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:LNR5WQRRVUIBFL76SX4GYL6KXB","short_pith_number":"pith:LNR5WQRR","canonical_record":{"source":{"id":"1511.03292","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2015-11-10T21:14:51Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"64bc5d6f46ea656b11e7665b910110aef9fb8ee0a5e22ad13e53b716ec477d89","abstract_canon_sha256":"cd7d2190e2d267bd61afb630fa6f60ec47aa065482d330b9f0528f68b2232e9f"},"schema_version":"1.0"},"canonical_sha256":"5b63db4231ad1012affe95f86c2fcab84b6e70001cbd89adee64d7f483abf03c","source":{"kind":"arxiv","id":"1511.03292","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1511.03292","created_at":"2026-05-18T01:27:15Z"},{"alias_kind":"arxiv_version","alias_value":"1511.03292v1","created_at":"2026-05-18T01:27:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1511.03292","created_at":"2026-05-18T01:27:15Z"},{"alias_kind":"pith_short_12","alias_value":"LNR5WQRRVUIB","created_at":"2026-05-18T12:29:29Z"},{"alias_kind":"pith_short_16","alias_value":"LNR5WQRRVUIBFL76","created_at":"2026-05-18T12:29:29Z"},{"alias_kind":"pith_short_8","alias_value":"LNR5WQRR","created_at":"2026-05-18T12:29:29Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:LNR5WQRRVUIBFL76SX4GYL6KXB","target":"record","payload":{"canonical_record":{"source":{"id":"1511.03292","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2015-11-10T21:14:51Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"64bc5d6f46ea656b11e7665b910110aef9fb8ee0a5e22ad13e53b716ec477d89","abstract_canon_sha256":"cd7d2190e2d267bd61afb630fa6f60ec47aa065482d330b9f0528f68b2232e9f"},"schema_version":"1.0"},"canonical_sha256":"5b63db4231ad1012affe95f86c2fcab84b6e70001cbd89adee64d7f483abf03c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:27:15.838362Z","signature_b64":"obz/WqGNgFcuEbgrqNDbkw17AHtcnuUkbJI21bOo2YWUSRXuKEx2WkvCXkMavaq4AAKUDDf+aCVkM8MNk3/DBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5b63db4231ad1012affe95f86c2fcab84b6e70001cbd89adee64d7f483abf03c","last_reissued_at":"2026-05-18T01:27:15.837655Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:27:15.837655Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1511.03292","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:27:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"A4CBp2yrvj8RYb9pWPFB+wR8ocamnqzKEHcIb0vVX7BjeoDVAr/o51I5jojHz49o4v5EK82xzTUtbZRLdHQvDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T02:39:42.491516Z"},"content_sha256":"83e06988650c4dba3f45cea6218167845eb1a60cf35a0706033b67709c1c09f5","schema_version":"1.0","event_id":"sha256:83e06988650c4dba3f45cea6218167845eb1a60cf35a0706033b67709c1c09f5"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:LNR5WQRRVUIBFL76SX4GYL6KXB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"From Images to Sentences through Scene Description Graphs using Commonsense Reasoning and Knowledge","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.CV","authors_text":"Chitta Baral, Cornelia Fermuller, Somak Aditya, Yezhou Yang, Yiannis Aloimonos","submitted_at":"2015-11-10T21:14:51Z","abstract_excerpt":"In this paper we propose the construction of linguistic descriptions of images. This is achieved through the extraction of scene description graphs (SDGs) from visual scenes using an automatically constructed knowledge base. SDGs are constructed using both vision and reasoning. Specifically, commonsense reasoning is applied on (a) detections obtained from existing perception methods on given images, (b) a \"commonsense\" knowledge base constructed using natural language processing of image annotations and (c) lexical ontological knowledge from resources such as WordNet. Amazon Mechanical Turk(AM"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1511.03292","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:27:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ag6K2PdbKBbQZidx83dlwqKt6HdULd6AvN9ius2vH6XB91KFh8vBRRqZ240QaktKOlPZCtCUXWO9QCIAIMoTBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T02:39:42.492114Z"},"content_sha256":"6ccf2981956e4cc34984635dd449a178209e9738052f12f38ca505250c1015fa","schema_version":"1.0","event_id":"sha256:6ccf2981956e4cc34984635dd449a178209e9738052f12f38ca505250c1015fa"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/LNR5WQRRVUIBFL76SX4GYL6KXB/bundle.json","state_url":"https://pith.science/pith/LNR5WQRRVUIBFL76SX4GYL6KXB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/LNR5WQRRVUIBFL76SX4GYL6KXB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T02:39:42Z","links":{"resolver":"https://pith.science/pith/LNR5WQRRVUIBFL76SX4GYL6KXB","bundle":"https://pith.science/pith/LNR5WQRRVUIBFL76SX4GYL6KXB/bundle.json","state":"https://pith.science/pith/LNR5WQRRVUIBFL76SX4GYL6KXB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/LNR5WQRRVUIBFL76SX4GYL6KXB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:LNR5WQRRVUIBFL76SX4GYL6KXB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"cd7d2190e2d267bd61afb630fa6f60ec47aa065482d330b9f0528f68b2232e9f","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2015-11-10T21:14:51Z","title_canon_sha256":"64bc5d6f46ea656b11e7665b910110aef9fb8ee0a5e22ad13e53b716ec477d89"},"schema_version":"1.0","source":{"id":"1511.03292","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1511.03292","created_at":"2026-05-18T01:27:15Z"},{"alias_kind":"arxiv_version","alias_value":"1511.03292v1","created_at":"2026-05-18T01:27:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1511.03292","created_at":"2026-05-18T01:27:15Z"},{"alias_kind":"pith_short_12","alias_value":"LNR5WQRRVUIB","created_at":"2026-05-18T12:29:29Z"},{"alias_kind":"pith_short_16","alias_value":"LNR5WQRRVUIBFL76","created_at":"2026-05-18T12:29:29Z"},{"alias_kind":"pith_short_8","alias_value":"LNR5WQRR","created_at":"2026-05-18T12:29:29Z"}],"graph_snapshots":[{"event_id":"sha256:6ccf2981956e4cc34984635dd449a178209e9738052f12f38ca505250c1015fa","target":"graph","created_at":"2026-05-18T01:27:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In this paper we propose the construction of linguistic descriptions of images. This is achieved through the extraction of scene description graphs (SDGs) from visual scenes using an automatically constructed knowledge base. SDGs are constructed using both vision and reasoning. Specifically, commonsense reasoning is applied on (a) detections obtained from existing perception methods on given images, (b) a \"commonsense\" knowledge base constructed using natural language processing of image annotations and (c) lexical ontological knowledge from resources such as WordNet. Amazon Mechanical Turk(AM","authors_text":"Chitta Baral, Cornelia Fermuller, Somak Aditya, Yezhou Yang, Yiannis Aloimonos","cross_cats":["cs.AI","cs.CL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2015-11-10T21:14:51Z","title":"From Images to Sentences through Scene Description Graphs using Commonsense Reasoning and Knowledge"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1511.03292","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:83e06988650c4dba3f45cea6218167845eb1a60cf35a0706033b67709c1c09f5","target":"record","created_at":"2026-05-18T01:27:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"cd7d2190e2d267bd61afb630fa6f60ec47aa065482d330b9f0528f68b2232e9f","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2015-11-10T21:14:51Z","title_canon_sha256":"64bc5d6f46ea656b11e7665b910110aef9fb8ee0a5e22ad13e53b716ec477d89"},"schema_version":"1.0","source":{"id":"1511.03292","kind":"arxiv","version":1}},"canonical_sha256":"5b63db4231ad1012affe95f86c2fcab84b6e70001cbd89adee64d7f483abf03c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5b63db4231ad1012affe95f86c2fcab84b6e70001cbd89adee64d7f483abf03c","first_computed_at":"2026-05-18T01:27:15.837655Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:27:15.837655Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"obz/WqGNgFcuEbgrqNDbkw17AHtcnuUkbJI21bOo2YWUSRXuKEx2WkvCXkMavaq4AAKUDDf+aCVkM8MNk3/DBg==","signature_status":"signed_v1","signed_at":"2026-05-18T01:27:15.838362Z","signed_message":"canonical_sha256_bytes"},"source_id":"1511.03292","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:83e06988650c4dba3f45cea6218167845eb1a60cf35a0706033b67709c1c09f5","sha256:6ccf2981956e4cc34984635dd449a178209e9738052f12f38ca505250c1015fa"],"state_sha256":"4f3f601ca2b2df04cd181f51276788268dc41e5ab14fc4bfd6ad908a83f0dde7"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1kavI++JS/XCjrCCfjRk3Ey9rvSN68kiDQrNgkiEt9JofTt/LxaWYovzG+Ovdzmx++Jo4fVKsoI4xusNxFR/AQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T02:39:42.495618Z","bundle_sha256":"71660573c74a6f0e39afecffecdc6bf108bede6c6193f15dbde948fa8a776db1"}}