{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:V6Y3XUV3H7TUMGMWG7FDM4LBAW","short_pith_number":"pith:V6Y3XUV3","canonical_record":{"source":{"id":"1905.13358","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-05-31T00:07:24Z","cross_cats_sorted":["cs.CV"],"title_canon_sha256":"9dc84ffcae064a656739c56fbe03ae69968ccb2663fd6bf343598d9a0a754cc1","abstract_canon_sha256":"bfb39efed5d727e9e4a119106af59108e163a810374b4ecf5d81bed45bcbf6c3"},"schema_version":"1.0"},"canonical_sha256":"afb1bbd2bb3fe746199637ca367161059c44638eff6cf5ab8e7e6aafb9a06f71","source":{"kind":"arxiv","id":"1905.13358","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.13358","created_at":"2026-05-17T23:44:35Z"},{"alias_kind":"arxiv_version","alias_value":"1905.13358v1","created_at":"2026-05-17T23:44:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.13358","created_at":"2026-05-17T23:44:35Z"},{"alias_kind":"pith_short_12","alias_value":"V6Y3XUV3H7TU","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_16","alias_value":"V6Y3XUV3H7TUMGMW","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_8","alias_value":"V6Y3XUV3","created_at":"2026-05-18T12:33:30Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:V6Y3XUV3H7TUMGMWG7FDM4LBAW","target":"record","payload":{"canonical_record":{"source":{"id":"1905.13358","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-05-31T00:07:24Z","cross_cats_sorted":["cs.CV"],"title_canon_sha256":"9dc84ffcae064a656739c56fbe03ae69968ccb2663fd6bf343598d9a0a754cc1","abstract_canon_sha256":"bfb39efed5d727e9e4a119106af59108e163a810374b4ecf5d81bed45bcbf6c3"},"schema_version":"1.0"},"canonical_sha256":"afb1bbd2bb3fe746199637ca367161059c44638eff6cf5ab8e7e6aafb9a06f71","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:44:35.193559Z","signature_b64":"jyWm3cUR0e292qNugcMuqNrn8kQSR9JthxOuXLzv+Z0JUxHr2tKVPMvQLt4KzADAHcCf8iHdVPXAALHX4/BoDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"afb1bbd2bb3fe746199637ca367161059c44638eff6cf5ab8e7e6aafb9a06f71","last_reissued_at":"2026-05-17T23:44:35.193026Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:44:35.193026Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1905.13358","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8UxPRGiPjxj2qHCQ2kAjpw08Kc5OdSNq52rawgtU/STCbY69HC4E/wqXHr1yvWOE3Af2BnJobAyK5a61qKyyCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T05:58:22.946368Z"},"content_sha256":"6a011cdec4a343b6cf130480d3e5b9913c3f05e3cc5317b858b3ea8cec0f89ba","schema_version":"1.0","event_id":"sha256:6a011cdec4a343b6cf130480d3e5b9913c3f05e3cc5317b858b3ea8cec0f89ba"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:V6Y3XUV3H7TUMGMWG7FDM4LBAW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Multi-modal Discriminative Model for Vision-and-Language Navigation","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":["cs.CV"],"primary_cat":"cs.CL","authors_text":"Eugene Ie, Haoshuo Huang, Harsh Mehta, Jason Baldridge, Vihan Jain","submitted_at":"2019-05-31T00:07:24Z","abstract_excerpt":"Vision-and-Language Navigation (VLN) is a natural language grounding task where agents have to interpret natural language instructions in the context of visual scenes in a dynamic environment to achieve prescribed navigation goals. Successful agents must have the ability to parse natural language of varying linguistic styles, ground them in potentially unfamiliar scenes, plan and react with ambiguous environmental feedback. Generalization ability is limited by the amount of human annotated data. In particular, \\emph{paired} vision-language sequence data is expensive to collect. We develop a di"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.13358","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:44:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hHN431c3C60b0lXl9gt3LsIiho77mEeG5VXZuv8gNOHvJuX7Z6Pvuval2V+kHg2tL0h9F5pZDjgPZfNJpS9NAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T05:58:22.946817Z"},"content_sha256":"8866458b8a4ae1e43be1e7776bd038e8523a17c0437d71a577ee16283b2710e5","schema_version":"1.0","event_id":"sha256:8866458b8a4ae1e43be1e7776bd038e8523a17c0437d71a577ee16283b2710e5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/V6Y3XUV3H7TUMGMWG7FDM4LBAW/bundle.json","state_url":"https://pith.science/pith/V6Y3XUV3H7TUMGMWG7FDM4LBAW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/V6Y3XUV3H7TUMGMWG7FDM4LBAW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T05:58:22Z","links":{"resolver":"https://pith.science/pith/V6Y3XUV3H7TUMGMWG7FDM4LBAW","bundle":"https://pith.science/pith/V6Y3XUV3H7TUMGMWG7FDM4LBAW/bundle.json","state":"https://pith.science/pith/V6Y3XUV3H7TUMGMWG7FDM4LBAW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/V6Y3XUV3H7TUMGMWG7FDM4LBAW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:V6Y3XUV3H7TUMGMWG7FDM4LBAW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"bfb39efed5d727e9e4a119106af59108e163a810374b4ecf5d81bed45bcbf6c3","cross_cats_sorted":["cs.CV"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-05-31T00:07:24Z","title_canon_sha256":"9dc84ffcae064a656739c56fbe03ae69968ccb2663fd6bf343598d9a0a754cc1"},"schema_version":"1.0","source":{"id":"1905.13358","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1905.13358","created_at":"2026-05-17T23:44:35Z"},{"alias_kind":"arxiv_version","alias_value":"1905.13358v1","created_at":"2026-05-17T23:44:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1905.13358","created_at":"2026-05-17T23:44:35Z"},{"alias_kind":"pith_short_12","alias_value":"V6Y3XUV3H7TU","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_16","alias_value":"V6Y3XUV3H7TUMGMW","created_at":"2026-05-18T12:33:30Z"},{"alias_kind":"pith_short_8","alias_value":"V6Y3XUV3","created_at":"2026-05-18T12:33:30Z"}],"graph_snapshots":[{"event_id":"sha256:8866458b8a4ae1e43be1e7776bd038e8523a17c0437d71a577ee16283b2710e5","target":"graph","created_at":"2026-05-17T23:44:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Vision-and-Language Navigation (VLN) is a natural language grounding task where agents have to interpret natural language instructions in the context of visual scenes in a dynamic environment to achieve prescribed navigation goals. Successful agents must have the ability to parse natural language of varying linguistic styles, ground them in potentially unfamiliar scenes, plan and react with ambiguous environmental feedback. Generalization ability is limited by the amount of human annotated data. In particular, \\emph{paired} vision-language sequence data is expensive to collect. We develop a di","authors_text":"Eugene Ie, Haoshuo Huang, Harsh Mehta, Jason Baldridge, Vihan Jain","cross_cats":["cs.CV"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-05-31T00:07:24Z","title":"Multi-modal Discriminative Model for Vision-and-Language Navigation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1905.13358","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6a011cdec4a343b6cf130480d3e5b9913c3f05e3cc5317b858b3ea8cec0f89ba","target":"record","created_at":"2026-05-17T23:44:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"bfb39efed5d727e9e4a119106af59108e163a810374b4ecf5d81bed45bcbf6c3","cross_cats_sorted":["cs.CV"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2019-05-31T00:07:24Z","title_canon_sha256":"9dc84ffcae064a656739c56fbe03ae69968ccb2663fd6bf343598d9a0a754cc1"},"schema_version":"1.0","source":{"id":"1905.13358","kind":"arxiv","version":1}},"canonical_sha256":"afb1bbd2bb3fe746199637ca367161059c44638eff6cf5ab8e7e6aafb9a06f71","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"afb1bbd2bb3fe746199637ca367161059c44638eff6cf5ab8e7e6aafb9a06f71","first_computed_at":"2026-05-17T23:44:35.193026Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:44:35.193026Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"jyWm3cUR0e292qNugcMuqNrn8kQSR9JthxOuXLzv+Z0JUxHr2tKVPMvQLt4KzADAHcCf8iHdVPXAALHX4/BoDg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:44:35.193559Z","signed_message":"canonical_sha256_bytes"},"source_id":"1905.13358","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6a011cdec4a343b6cf130480d3e5b9913c3f05e3cc5317b858b3ea8cec0f89ba","sha256:8866458b8a4ae1e43be1e7776bd038e8523a17c0437d71a577ee16283b2710e5"],"state_sha256":"ec52776805a241499eae69901de7a6ae9ab203c5ec2ff0d12628a964659cd37d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FfiTKIVR/Ejo2ln9TUxEYWxxhS6UIxvgfVQBm/Dtf/rEK4nqM3CED+ImfMOd3u/QBHSGv7aCtpi100qtn/JhCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T05:58:22.949104Z","bundle_sha256":"948f240c6b8f5de8170cf51ece3db0b5c4619cec231e86145527f5d051a1a0bd"}}