{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:3VQFEKT7HXPWXZ3SXLXSZZOKU7","short_pith_number":"pith:3VQFEKT7","canonical_record":{"source":{"id":"2605.19130","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T21:30:54Z","cross_cats_sorted":["cs.AI","cs.CL","cs.CV"],"title_canon_sha256":"b171157aab2f7f4a8379ee573b2c281e4b4eef5a2c43e692a8169f2af2504a41","abstract_canon_sha256":"4cf93700ebaf7433e1babebaf5190ad8cbfccc7df34c5dfbf0503cd87edec04d"},"schema_version":"1.0"},"canonical_sha256":"dd60522a7f3ddf6be772baef2ce5caa7f2c0f0e4a3228069541e1c1cf9731d1c","source":{"kind":"arxiv","id":"2605.19130","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19130","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19130v1","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19130","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"pith_short_12","alias_value":"3VQFEKT7HXPW","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"pith_short_16","alias_value":"3VQFEKT7HXPWXZ3S","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"pith_short_8","alias_value":"3VQFEKT7","created_at":"2026-05-20T01:05:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:3VQFEKT7HXPWXZ3SXLXSZZOKU7","target":"record","payload":{"canonical_record":{"source":{"id":"2605.19130","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T21:30:54Z","cross_cats_sorted":["cs.AI","cs.CL","cs.CV"],"title_canon_sha256":"b171157aab2f7f4a8379ee573b2c281e4b4eef5a2c43e692a8169f2af2504a41","abstract_canon_sha256":"4cf93700ebaf7433e1babebaf5190ad8cbfccc7df34c5dfbf0503cd87edec04d"},"schema_version":"1.0"},"canonical_sha256":"dd60522a7f3ddf6be772baef2ce5caa7f2c0f0e4a3228069541e1c1cf9731d1c","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T01:05:28.752106Z","signature_b64":"E1b0+9YwprhgpPwW0j0rZ0jEXU3m7vKTHczs8/YNSH67rM+iVo9bK6Qo4TEJxfARZ5bUYj7BeVJsCrSWfyqxDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"dd60522a7f3ddf6be772baef2ce5caa7f2c0f0e4a3228069541e1c1cf9731d1c","last_reissued_at":"2026-05-20T01:05:28.751405Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T01:05:28.751405Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.19130","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"oCCxPmYL/XYqj9+0jPV65TFiaoIQGilpqreDydS+wLBMRPzRiJgiD+U24PUT+eV5FfbjapPExPY6zhU4lGJ1CQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T01:41:36.878356Z"},"content_sha256":"deeef75329b2b6158e7dc9756aae4e578789bbfbd2a77afc278c0d2ac1817b27","schema_version":"1.0","event_id":"sha256:deeef75329b2b6158e7dc9756aae4e578789bbfbd2a77afc278c0d2ac1817b27"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:3VQFEKT7HXPWXZ3SXLXSZZOKU7","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"EgoBabyVLM: Benchmarking Cross-Modal Learning from Naturalistic Egocentric Video Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CL","cs.CV"],"primary_cat":"cs.LG","authors_text":"Alvin W. M. Tan, Angel Villar Corrales, Bal\\'azs K\\'egl, Charles-\\'Eric Saint-James, Dongyan Lin, Emmanuel Dupoux, Jiayi Shen, Juan Pino, Mahi Luthra, Manel Khentout, Martin Gleize, Michael C. Frank, Nicolas Hamilakis, Phillip Rust, Rashel Moritz, Sheila Krogh-Jespersen, Sho Tsuji, Surya Parimi, Tom Fizycki, Vanessa Stark, Yosuke Higuchi, Youssef Benchekroun","submitted_at":"2026-05-18T21:30:54Z","abstract_excerpt":"Children acquire language grounding with remarkable robustness from limited visuo-linguistic input in ways that surpass today's best large multimodal models. Recent research suggests current vision-language models (VLMs) trained on curated web data fail to generalize to the sparse, weakly-aligned egocentric streams produced by wearable devices, embodied agents, and infant head-cams -- and no fixed evaluation pipeline exists for measuring progress on this regime. We train VLMs on datasets with varying degrees of semantic alignment between visual and linguistic inputs, including naturalistic inf"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19130","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.19130/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:28Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ohdOxgmoOpb1mbUy+6jN+jcUJms5I1fwCZL84cntD8C2KeHNk4jHy3QvZvCwV3A8j8a07YJvECOMY/56YE9oBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T01:41:36.879066Z"},"content_sha256":"46ccd76018ae1b2f76e2fddaf7fccd3729bf4190d785fdcb1c21869821cd8771","schema_version":"1.0","event_id":"sha256:46ccd76018ae1b2f76e2fddaf7fccd3729bf4190d785fdcb1c21869821cd8771"},{"event_type":"integrity_finding","subject_pith_number":"pith:2026:3VQFEKT7HXPWXZ3SXLXSZZOKU7","target":"integrity","payload":{"note":"Identifier '10.5555/3692070.3694094' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Villalobos, P., Ho, A., Sevilla, J., Besiroglu, T., Heim, L., and Hobbhahn, M. Position: will we run out of data? limits of llm scaling based on human-generated data. In Proceedings of the 41st International Conference on Machine Learning, ","arxiv_id":"2605.19130","detector":"doi_compliance","evidence":{"doi":"10.5555/3692070.3694094","arxiv_id":null,"ref_index":54,"raw_excerpt":"Villalobos, P., Ho, A., Sevilla, J., Besiroglu, T., Heim, L., and Hobbhahn, M. Position: will we run out of data? limits of llm scaling based on human-generated data. In Proceedings of the 41st International Conference on Machine Learning, ICML'24. JMLR.org, 2024. URL https://dl.acm.org/doi/10.5555/3692070.3694094","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":54,"audited_at":"2026-05-20T12:22:14.614511Z","event_type":"pith.integrity.v1","detected_doi":"10.5555/3692070.3694094","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"89c76db84e5cead465d97a784df39f950c3e8bd80474cc1d840172ad9b5fbc8b","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null,"integrity_event_id":5138,"payload_sha256":"3459540b36a11d1193a14d54b3a7ee1a83ef38411c147c5ea60f003fcb3a44ec","signature_b64":"gyoicwf0KBBBo9VDL8kAslIivAPAaP1lWxwfmaxprhpwEfHET6rZJKUym2FsYywSK4xQ68+pNrGzrV1BuIdwAw==","signing_key_id":"pith-v1-2026-05"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T12:22:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"B++PXhxDXfWROBy64Uec0EJbEV1gBLnkIZw/pd88oPV/feKWeMojhRy41oIiXIrrt/kOzEumeQa3LWlTAeLkDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T01:41:36.880669Z"},"content_sha256":"4d680357b1c39b5909327d74c60fc44dc58d9a42b8791f61da30f0af022503e0","schema_version":"1.0","event_id":"sha256:4d680357b1c39b5909327d74c60fc44dc58d9a42b8791f61da30f0af022503e0"},{"event_type":"integrity_finding","subject_pith_number":"pith:2026:3VQFEKT7HXPWXZ3SXLXSZZOKU7","target":"integrity","payload":{"note":"Identifier '10.5555/2969033.2969091' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Eigen, D., Puhrsch, C., and Fergus, R. Depth map prediction from a single image using a multi-scale deep network. In Proceedings of the 28th International Conference on Neural Information Processing Systems - Volume 2, NIPS'14, pp.\\ 2366–23","arxiv_id":"2605.19130","detector":"doi_compliance","evidence":{"doi":"10.5555/2969033.2969091","arxiv_id":null,"ref_index":16,"raw_excerpt":"Eigen, D., Puhrsch, C., and Fergus, R. Depth map prediction from a single image using a multi-scale deep network. In Proceedings of the 28th International Conference on Neural Information Processing Systems - Volume 2, NIPS'14, pp.\\ 2366–2374, Cambridge, MA, USA, 2014. MIT Press. URL https://dl.acm.org/doi/10.5555/2969033.2969091","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":16,"audited_at":"2026-05-20T12:22:14.614511Z","event_type":"pith.integrity.v1","detected_doi":"10.5555/2969033.2969091","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"da594c9f83f52e6e63ca9f4af00598cb083f2d0ef070f1baea5741e045df4ef1","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null,"integrity_event_id":5137,"payload_sha256":"1690ea9504b818f321139d1edac0da7c0d271aea585fb9db191103d7ccae93e7","signature_b64":"iWlk+LWCfEZMpzOhj1gFv7h+mmvZohpYgL0ohUH5DpydgSs5pOlJYJWS2Nk5AuWewbhdQVCOXadjroq7MYPyDw==","signing_key_id":"pith-v1-2026-05"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T12:22:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Pv0Yn+la+QowxA5zzbBTYJkU4aeu4Hd/QXikyY1x2MzhnfduUl/1DSGnntPXvVDcVxBzARrA6+Pbxq8azIPdCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T01:41:36.881260Z"},"content_sha256":"7babf9effee148a382851670f26676f65337b080773cb8ca5177f234f8ef44fd","schema_version":"1.0","event_id":"sha256:7babf9effee148a382851670f26676f65337b080773cb8ca5177f234f8ef44fd"},{"event_type":"integrity_finding","subject_pith_number":"pith:2026:3VQFEKT7HXPWXZ3SXLXSZZOKU7","target":"integrity","payload":{"note":"Identifier '10.5555/3600270.3601993' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Alayrac, J.-B., Donahue, J., Luc, P., Miech, A., Barr, I., Hasson, Y., Lenc, K., Mensch, A., Millican, K., Reynolds, M., et al. Flamingo: a visual language model for few-shot learning. Advances in neural information processing systems, 35: ","arxiv_id":"2605.19130","detector":"doi_compliance","evidence":{"doi":"10.5555/3600270.3601993","arxiv_id":null,"ref_index":1,"raw_excerpt":"Alayrac, J.-B., Donahue, J., Luc, P., Miech, A., Barr, I., Hasson, Y., Lenc, K., Mensch, A., Millican, K., Reynolds, M., et al. Flamingo: a visual language model for few-shot learning. Advances in neural information processing systems, 35: 0 23716--23736, 2022. URL https://dl.acm.org/doi/10.5555/3600270.3601993","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":1,"audited_at":"2026-05-20T12:22:14.614511Z","event_type":"pith.integrity.v1","detected_doi":"10.5555/3600270.3601993","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"2718114ee3c35f0913114cd751715fa9b436404f7ed97bd42273c7e629a103b9","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null,"integrity_event_id":5136,"payload_sha256":"359a467bbf689300141b58e18012bd1b167320ad53ebbe512c8fe46576408376","signature_b64":"0xZlY/uV8iScO6ha/xPOWr5ONcVSjN6MLhugytkI8C5kqCa2GdzkK9YzVXxpRF8MWIKm3cUevs6YmAoJoCQqCw==","signing_key_id":"pith-v1-2026-05"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T12:22:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OP2dcU8cOsDyb5cUmH22KJVjJgWVxDNh+mt9iiBZbWP+P1fsrCvJoqttJsLzubWyD2dBn2g5/O00uPTT7bkwDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-22T01:41:36.881834Z"},"content_sha256":"dadaff7c08f6f0d8b580192206520ce6dbdff0152daca29ba59323d5bb3c1ac9","schema_version":"1.0","event_id":"sha256:dadaff7c08f6f0d8b580192206520ce6dbdff0152daca29ba59323d5bb3c1ac9"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3VQFEKT7HXPWXZ3SXLXSZZOKU7/bundle.json","state_url":"https://pith.science/pith/3VQFEKT7HXPWXZ3SXLXSZZOKU7/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3VQFEKT7HXPWXZ3SXLXSZZOKU7/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-22T01:41:36Z","links":{"resolver":"https://pith.science/pith/3VQFEKT7HXPWXZ3SXLXSZZOKU7","bundle":"https://pith.science/pith/3VQFEKT7HXPWXZ3SXLXSZZOKU7/bundle.json","state":"https://pith.science/pith/3VQFEKT7HXPWXZ3SXLXSZZOKU7/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3VQFEKT7HXPWXZ3SXLXSZZOKU7/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:3VQFEKT7HXPWXZ3SXLXSZZOKU7","merge_version":"pith-open-graph-merge-v1","event_count":5,"valid_event_count":5,"invalid_event_count":0,"equivocation_count":1,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4cf93700ebaf7433e1babebaf5190ad8cbfccc7df34c5dfbf0503cd87edec04d","cross_cats_sorted":["cs.AI","cs.CL","cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T21:30:54Z","title_canon_sha256":"b171157aab2f7f4a8379ee573b2c281e4b4eef5a2c43e692a8169f2af2504a41"},"schema_version":"1.0","source":{"id":"2605.19130","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19130","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19130v1","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19130","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"pith_short_12","alias_value":"3VQFEKT7HXPW","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"pith_short_16","alias_value":"3VQFEKT7HXPWXZ3S","created_at":"2026-05-20T01:05:28Z"},{"alias_kind":"pith_short_8","alias_value":"3VQFEKT7","created_at":"2026-05-20T01:05:28Z"}],"graph_snapshots":[{"event_id":"sha256:46ccd76018ae1b2f76e2fddaf7fccd3729bf4190d785fdcb1c21869821cd8771","target":"graph","created_at":"2026-05-20T01:05:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.19130/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Children acquire language grounding with remarkable robustness from limited visuo-linguistic input in ways that surpass today's best large multimodal models. Recent research suggests current vision-language models (VLMs) trained on curated web data fail to generalize to the sparse, weakly-aligned egocentric streams produced by wearable devices, embodied agents, and infant head-cams -- and no fixed evaluation pipeline exists for measuring progress on this regime. We train VLMs on datasets with varying degrees of semantic alignment between visual and linguistic inputs, including naturalistic inf","authors_text":"Alvin W. M. Tan, Angel Villar Corrales, Bal\\'azs K\\'egl, Charles-\\'Eric Saint-James, Dongyan Lin, Emmanuel Dupoux, Jiayi Shen, Juan Pino, Mahi Luthra, Manel Khentout, Martin Gleize, Michael C. Frank, Nicolas Hamilakis, Phillip Rust, Rashel Moritz, Sheila Krogh-Jespersen, Sho Tsuji, Surya Parimi, Tom Fizycki, Vanessa Stark, Yosuke Higuchi, Youssef Benchekroun","cross_cats":["cs.AI","cs.CL","cs.CV"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T21:30:54Z","title":"EgoBabyVLM: Benchmarking Cross-Modal Learning from Naturalistic Egocentric Video Data"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19130","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:deeef75329b2b6158e7dc9756aae4e578789bbfbd2a77afc278c0d2ac1817b27","target":"record","created_at":"2026-05-20T01:05:28Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4cf93700ebaf7433e1babebaf5190ad8cbfccc7df34c5dfbf0503cd87edec04d","cross_cats_sorted":["cs.AI","cs.CL","cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T21:30:54Z","title_canon_sha256":"b171157aab2f7f4a8379ee573b2c281e4b4eef5a2c43e692a8169f2af2504a41"},"schema_version":"1.0","source":{"id":"2605.19130","kind":"arxiv","version":1}},"canonical_sha256":"dd60522a7f3ddf6be772baef2ce5caa7f2c0f0e4a3228069541e1c1cf9731d1c","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"dd60522a7f3ddf6be772baef2ce5caa7f2c0f0e4a3228069541e1c1cf9731d1c","first_computed_at":"2026-05-20T01:05:28.751405Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T01:05:28.751405Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"E1b0+9YwprhgpPwW0j0rZ0jEXU3m7vKTHczs8/YNSH67rM+iVo9bK6Qo4TEJxfARZ5bUYj7BeVJsCrSWfyqxDQ==","signature_status":"signed_v1","signed_at":"2026-05-20T01:05:28.752106Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.19130","source_kind":"arxiv","source_version":1}}},"equivocations":[{"signer_id":"pith.science","event_type":"integrity_finding","target":"integrity","event_ids":["sha256:4d680357b1c39b5909327d74c60fc44dc58d9a42b8791f61da30f0af022503e0","sha256:7babf9effee148a382851670f26676f65337b080773cb8ca5177f234f8ef44fd","sha256:dadaff7c08f6f0d8b580192206520ce6dbdff0152daca29ba59323d5bb3c1ac9"]}],"invalid_events":[],"applied_event_ids":["sha256:deeef75329b2b6158e7dc9756aae4e578789bbfbd2a77afc278c0d2ac1817b27","sha256:46ccd76018ae1b2f76e2fddaf7fccd3729bf4190d785fdcb1c21869821cd8771"],"state_sha256":"51174f4d136ae715a52288e71cca370053e5da6af6ec0b3570b07d67fb9e6e54"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"3eETiajQhujWUa/PtDMnVy0s7OrxWrYz4FdgZ9qoW/FGVsLCPySKeC+CRmg8Kf3cqeYGDbM03dD7r0yJEPArDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-22T01:41:36.886226Z","bundle_sha256":"9966dd529f4df9881aea955234221afd566110770a01f3c695b5bc09c348b88f"}}