{"schema":"https://pith.science/schemas/pith-integrity/v1.json","pith_number":"2604.22226","arxiv_id":"2604.22226","integrity":{"available":true,"endpoint":"/pith/2604.22226/integrity.json","summary":{"critical":27,"advisory":0,"informational":0,"by_detector":{"doi_compliance":{"total":27,"critical":27,"advisory":0,"informational":0}}},"clean":false,"detectors_run":[{"name":"ai_meta_artifact","version":"1.0.0","status":"completed","ran_at":"2026-05-21T11:34:50.807535Z","findings_count":0},{"name":"doi_compliance","version":"1.0.0","status":"completed","ran_at":"2026-05-20T00:12:39.924367Z","findings_count":27}],"findings":[{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2511.216311' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2511.216311","detected_arxiv_id":null,"ref_index":2,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2509.2366112' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2509.2366112","detected_arxiv_id":null,"ref_index":1,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2412.120752' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2412.120752","detected_arxiv_id":null,"ref_index":3,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2601.106111' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2601.106111","detected_arxiv_id":null,"ref_index":5,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2412.0527111' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2412.0527111","detected_arxiv_id":null,"ref_index":4,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2401.015057' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2401.015057","detected_arxiv_id":null,"ref_index":16,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.1007/978-3-031-72652-1_64' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.1007/978-3-031-72652-1_64","detected_arxiv_id":null,"ref_index":19,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2512.055134' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2512.055134","detected_arxiv_id":null,"ref_index":28,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2406.163382' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2406.163382","detected_arxiv_id":null,"ref_index":35,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2506.094454' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2506.094454","detected_arxiv_id":null,"ref_index":12,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.1109/iccv51070.2023.012752' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.1109/iccv51070.2023.012752","detected_arxiv_id":null,"ref_index":18,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2402.0330013' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2402.0330013","detected_arxiv_id":null,"ref_index":27,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2507.133534' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2507.133534","detected_arxiv_id":null,"ref_index":32,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2511.064994' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2511.064994","detected_arxiv_id":null,"ref_index":39,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2501.139194' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2501.139194","detected_arxiv_id":null,"ref_index":17,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2508.1173712' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2508.1173712","detected_arxiv_id":null,"ref_index":21,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2410.032904' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2410.032904","detected_arxiv_id":null,"ref_index":31,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2510.182349' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2510.182349","detected_arxiv_id":null,"ref_index":36,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2410.084744' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2410.084744","detected_arxiv_id":null,"ref_index":41,"audited_at":"2026-05-20T00:12:39.924367Z"},{"detector":"doi_compliance","finding_type":"unresolvable_identifier","severity":"critical","verdict_class":"cross_source","note":"Identifier '10.48550/arxiv.2506.108577' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","detected_doi":"10.48550/arxiv.2506.108577","detected_arxiv_id":null,"ref_index":49,"audited_at":"2026-05-20T00:12:39.924367Z"}],"snapshot_sha256":"02a92771ad509214c68bd4dca09b79de48bf5565ee5784d7affdf63c306f37f3"},"events":[{"event_id":3804,"event_type":"pith.integrity.v1","payload_sha256":"2293c0e0ebcbfd809cd019b0dd148ec9e3f7bf52e4b51621ed713c447cb3a121","signature_b64":"AVhOc0I5yhd0PV7tDo7OKs55kFUCXoxjCjPvJeyLCbAUDq6Q8g6gxVem8wVBdyJvn2kh8Ck5AiswydvV6uT3DA==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.103577+00:00","payload":{"note":"Identifier '10.48550/arxiv.2511.129087' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Zou, J., Xia, H., Ye, Z., Zhang, S., Lai, C., et al.: DeepSport: A multimodal large language model for comprehensive sports video reasoning via agentic reinforcement learning (Nov 2025).https://doi.org/10.48550/arXiv.2511.129087","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2511.129087","arxiv_id":null,"ref_index":55,"raw_excerpt":"Zou, J., Xia, H., Ye, Z., Zhang, S., Lai, C., et al.: DeepSport: A multimodal large language model for comprehensive sports video reasoning via agentic reinforcement learning (Nov 2025).https://doi.org/10.48550/arXiv.2511.129087","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":55,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2511.129087","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"b01746fb6212d3c5e195b912ee002fffa1d7d302b25b0b4cdad9d6ab8434c45e","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3803,"event_type":"pith.integrity.v1","payload_sha256":"e4c7ccf0301cb6abf4dafdf2d978eed9a482389036fae3a9c6f9de30d0b8a8e5","signature_b64":"syGUr9ZpCOUiPMpYdZ9t6ReXqKryHjmhI97zT9dgzKM8+A1M4Q2VDxb37nTq1Iy+lm5mj/IKBv2/X6aLYqIdDw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.101245+00:00","payload":{"note":"Identifier '10.48550/arxiv.2409.165972' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Zhang, J., Jiao, Y., Chen, S., Zhao, N., Tan, Z., et al.: Eventhallusion: Diagnosing event hallucinations in video llms. arXiv preprint arXiv:2409.16597 (2024).https: //doi.org/10.48550/arXiv.2409.165972","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2409.165972","arxiv_id":null,"ref_index":52,"raw_excerpt":"Zhang, J., Jiao, Y., Chen, S., Zhao, N., Tan, Z., et al.: Eventhallusion: Diagnosing event hallucinations in video llms. arXiv preprint arXiv:2409.16597 (2024).https: //doi.org/10.48550/arXiv.2409.165972","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":52,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2409.165972","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"188cb48f637031784f45bb3958d8d94765ff3286edb1e9f8876aecfdb6b9322b","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3802,"event_type":"pith.integrity.v1","payload_sha256":"dea5adfb23c032144d33606de69dff8fe55643f5bf7af7ce6f5f993e0147103d","signature_b64":"mSMWoL4HF37dkMiJDoCBdXkpHBeCyGMevCZTU6V+oT6WwdmcJxr4EVHxM99IGLtta38UFWmrQV/8f7vl5UpOCQ==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.099061+00:00","payload":{"note":"Identifier '10.48550/arxiv.2508.044164' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Zhang, H., Gu, X., Li, J., Ma, C., Bai, S., et al.: Thinking with videos: Multimodal tool-augmented reinforcement learning for long video reasoning (Sep 2025).https: //doi.org/10.48550/arXiv.2508.044164","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2508.044164","arxiv_id":null,"ref_index":51,"raw_excerpt":"Zhang, H., Gu, X., Li, J., Ma, C., Bai, S., et al.: Thinking with videos: Multimodal tool-augmented reinforcement learning for long video reasoning (Sep 2025).https: //doi.org/10.48550/arXiv.2508.044164","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":51,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2508.044164","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"11c13ebf465f0c3ca6eb35b6972bd8d8fb011af080fa01ca59db46dfa6ddce26","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3801,"event_type":"pith.integrity.v1","payload_sha256":"4990550fd6eb065e7f29da5657ea15c454bfb44373f3b0fe260415d62a07e548","signature_b64":"6c+EBfnmLNq/RHJJFIWRqMvHOxL1HJErXKZX57kzjhYmPauukyIyQm0LJP07TgmRymzkDqGNstY49+chiF4eCA==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.096452+00:00","payload":{"note":"Identifier '10.18653/v1/2023.emnlp-demo.4911' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Zhang, H., Li, X., Bing, L.: Video-LLaMA: An instruction-tuned audio-visual lan- guage model for video understanding. In: Feng, Y., Lefever, E. (eds.) Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing: S","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.18653/v1/2023.emnlp-demo.4911","arxiv_id":null,"ref_index":50,"raw_excerpt":"Zhang, H., Li, X., Bing, L.: Video-LLaMA: An instruction-tuned audio-visual lan- guage model for video understanding. In: Feng, Y., Lefever, E. (eds.) Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing: System Demonstrations. pp. 543–553. Association for Computational Linguistics, Singapore (Dec 2023).https://doi.org/10.18653/v1/2023.emnlp-demo.4911","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":50,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.18653/v1/2023.emnlp-demo.4911","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"4a4a17eb6437b15e942ad7014ba5d99e1fa0872bccab38461241074b4a38be98","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3800,"event_type":"pith.integrity.v1","payload_sha256":"3e196f4d539dea305082e50a0cd14d576bb606d5c428a3f2bc601056c65186f6","signature_b64":"sgQv1HAaHhZRo+beX/sjxW9p9gx8z25CsSsCWfk5mh74/Vl9vCsJucM4s3xnRxYFAq7gnwbEkOxqkU2e+9iQBw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.094485+00:00","payload":{"note":"Identifier '10.48550/arxiv.2506.108577' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Yu, J., Wu, Y., Chu, M., Ren, Z., Huang, Z., et al.: VRBench: A Benchmark for Multi-Step Reasoning in Long Narrative Videos (Aug 2025).https://doi.org/ 10.48550/arXiv.2506.108577","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2506.108577","arxiv_id":null,"ref_index":49,"raw_excerpt":"Yu, J., Wu, Y., Chu, M., Ren, Z., Huang, Z., et al.: VRBench: A Benchmark for Multi-Step Reasoning in Long Narrative Videos (Aug 2025).https://doi.org/ 10.48550/arXiv.2506.108577","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":49,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2506.108577","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"a2d2718a7fa2b0c0795366c4738b0059b2ba91891857871c8990ca77c2e9e7a2","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3799,"event_type":"pith.integrity.v1","payload_sha256":"8e1714c76d390e6dc258c64ba8c6836bfc5dc59b99915300a241c6cd303279d5","signature_b64":"91+7iWI4J6a/HfWW1482PY+T8SfodfWUeihBS9owZkXUp6MnBUbDPYx/WGkEvP0yMIRF5ew9Qk3Bud/9TQ/sAw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.092367+00:00","payload":{"note":"Identifier '10.48550/arxiv.2511.207854' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Yang, Z., Wang, S., Zhang, K., Wu, K., Leng, S., et al.: LongVT: Incentivizing \"thinking with long videos\" via native tool calling (Nov 2025).https://doi.org/ 10.48550/arXiv.2511.207854","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2511.207854","arxiv_id":null,"ref_index":45,"raw_excerpt":"Yang, Z., Wang, S., Zhang, K., Wu, K., Leng, S., et al.: LongVT: Incentivizing \"thinking with long videos\" via native tool calling (Nov 2025).https://doi.org/ 10.48550/arXiv.2511.207854","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":45,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2511.207854","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"9de9bee1007efe70942b8ab932057f7483896534dc9bae6b4f53a87f4e1fcdf8","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3798,"event_type":"pith.integrity.v1","payload_sha256":"d9c0719fc6a5470e1b126d7c817e29c4e9c9eb1762b4593851c035d76f4a6cbf","signature_b64":"LAYPSNkgit8e7twGEltH8OLlErJGd00EktYG3TsA4ObZYrib28/OIBDfhWbqtmJR8ts8LW9Fm8edp6r9aLMRBQ==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.090102+00:00","payload":{"note":"Identifier '10.48550/arxiv.2503.1894314' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Xu, M., Gao, M., Li, S., Lu, J., Gan, Z., et al.: SlowFast-LLaVA-1.5: A family of token-efficient video large language models for long-form video understanding (Mar 2025).https://doi.org/10.48550/arXiv.2503.1894314","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2503.1894314","arxiv_id":null,"ref_index":43,"raw_excerpt":"Xu, M., Gao, M., Li, S., Lu, J., Gan, Z., et al.: SlowFast-LLaVA-1.5: A family of token-efficient video large language models for long-form video understanding (Mar 2025).https://doi.org/10.48550/arXiv.2503.1894314","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":43,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2503.1894314","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"5d2f29a2c924cb578b988e12f5cbdcb9c73777421c5825cb1d19a3172356b2a9","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3797,"event_type":"pith.integrity.v1","payload_sha256":"7dabbd1f2cd594c46e5280d93f4ff5d6082334123a8b0e35055bbcd9d55c24eb","signature_b64":"NkkdJUVT13tzL1IAA6dQeJoEcKLYlasrJj9J9lNSMBhyUlUO80z+vK0e6rvsGKlg3YYsYyP3MqlqjkKq59oGAg==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.087985+00:00","payload":{"note":"Identifier '10.48550/arxiv.2410.084744' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Xia, H., Yang, Z., Zou, J., Tracy, R., Wang, Y., et al.: SPORTU: A comprehen- sive sports understanding benchmark for multimodal large language models (Mar 2025).https://doi.org/10.48550/arXiv.2410.084744, 7","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2410.084744","arxiv_id":null,"ref_index":41,"raw_excerpt":"Xia, H., Yang, Z., Zou, J., Tracy, R., Wang, Y., et al.: SPORTU: A comprehen- sive sports understanding benchmark for multimodal large language models (Mar 2025).https://doi.org/10.48550/arXiv.2410.084744, 7","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":41,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2410.084744","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"c096b72977a9e3a33940641442c2b78261e0955e2cf7ca0e9c92b6270b85f577","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3796,"event_type":"pith.integrity.v1","payload_sha256":"90008bbd48ac4ce8759145310001ede8352190d6bd06100ff486c8ba5d32f719","signature_b64":"ZiO0A4m1jOVZryDW/KY3Q1jmETxZL5Jhn1ed+h+as0Et1Nci83/p3pgecE6LIaxO7OczZIj1ZV7aBNK++sNuBw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.085811+00:00","payload":{"note":"Identifier '10.48550/arxiv.2402.158622' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Xia, H., Yang, Z., Wang, Y., Tracy, R., Zhao, Y., et al.: SportQA: A benchmark for sports understanding in large language models (Jun 2024).https://doi.org/ 10.48550/arXiv.2402.158622, 4, 7","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2402.158622","arxiv_id":null,"ref_index":40,"raw_excerpt":"Xia, H., Yang, Z., Wang, Y., Tracy, R., Zhao, Y., et al.: SportQA: A benchmark for sports understanding in large language models (Jun 2024).https://doi.org/ 10.48550/arXiv.2402.158622, 4, 7","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":40,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2402.158622","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"387720df95a4cf3fca325a17649f2a64378a259170d4919387ae77e5bfd353bf","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3795,"event_type":"pith.integrity.v1","payload_sha256":"a04b793b70e53bf0b445758f9304effb0d4b0dee605e1672915c23af58300ba4","signature_b64":"gNEM60nv1QmMy6fky+JtGueh6gBpPG22smZX7GG/M8gtYKguxKxwpK+m5kBNJKkT08UT+LanNpBNkTXPQkNdAw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.083060+00:00","payload":{"note":"Identifier '10.48550/arxiv.2511.064994' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Xia, H., Ge, H., Zou, J., Choi, H.W., Zhang, X., et al.: SportR: A benchmark for multimodal large language model reasoning in sports (Nov 2025).https://doi. org/10.48550/arXiv.2511.064994, 7","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2511.064994","arxiv_id":null,"ref_index":39,"raw_excerpt":"Xia, H., Ge, H., Zou, J., Choi, H.W., Zhang, X., et al.: SportR: A benchmark for multimodal large language model reasoning in sports (Nov 2025).https://doi. org/10.48550/arXiv.2511.064994, 7","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":39,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2511.064994","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"4e80bf94c3555601f081d25566b86f1958c4d966cb25cf635ab9ba70719fe5e6","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3794,"event_type":"pith.integrity.v1","payload_sha256":"7ef12d364c4292b30ba51b1ac820723286df7f95b67827218edfcf6ced5ead90","signature_b64":"Q2yV7Qu5T6zcER0u4cVDMRbZwkNKfkpvLgB6S67N2h5EJWAtoUphAq8RV0NmCuxssUq2nSpx552emmVF7QsnCA==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.080437+00:00","payload":{"note":"Identifier '10.48550/arxiv.2510.182349' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Wei, H., Sun, Y., Li, Y.: DeepSeek-OCR: Contexts optical compression (Oct 2025). https://doi.org/10.48550/arXiv.2510.182349","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2510.182349","arxiv_id":null,"ref_index":36,"raw_excerpt":"Wei, H., Sun, Y., Li, Y.: DeepSeek-OCR: Contexts optical compression (Oct 2025). https://doi.org/10.48550/arXiv.2510.182349","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":36,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2510.182349","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"461f65a080b4b751c36672c39074fe1d01de3c23b10a2bac7b44d607c99ad2d3","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3793,"event_type":"pith.integrity.v1","payload_sha256":"8c8d8d7c4c68f6e0fe6d88ce6a4551a07e0c90111d8578dcda70d6cbae773910","signature_b64":"44lLV4FNfdXx7QtXWkieDl+SNcjNvNMNkFMg0hIa5D1jOzISVwTAnmOmpWGIuqW5omtzdJFlnBmPn0TWG7ZrDQ==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.077661+00:00","payload":{"note":"Identifier '10.48550/arxiv.2406.163382' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Wang, Y., Wang, Y., Zhao, D., Xie, C., Zheng, Z.: VideoHallucer: Evaluating intrinsic and extrinsic hallucinations in large video-language models (Jun 2024). https://doi.org/10.48550/arXiv.2406.163382","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2406.163382","arxiv_id":null,"ref_index":35,"raw_excerpt":"Wang, Y., Wang, Y., Zhao, D., Xie, C., Zheng, Z.: VideoHallucer: Evaluating intrinsic and extrinsic hallucinations in large video-language models (Jun 2024). https://doi.org/10.48550/arXiv.2406.163382","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":35,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2406.163382","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"dea001eca17533469910ae1d1699a81aab96dbaaed8eb38c959f152451d035e3","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3792,"event_type":"pith.integrity.v1","payload_sha256":"2f6d69f8ae53e6c69698853f446268fd63c3b0dd54d51dbfe29f4dd265ab2832","signature_b64":"siGbSWymPx74Jw+tPNecIU/pQCAJC5hafo78rYazIww4852+6AB+JKH3cdLFnizlaMBXaBlA4c/1/TIm5BQzBQ==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.075378+00:00","payload":{"note":"Identifier '10.48550/arxiv.2507.133534' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Wang, S., Chen, G., Huang, D.a., Li, Z., Li, M., et al.: VideoITG: Multimodal video understanding with instructed temporal grounding (Jul 2025).https://doi.org/ 10.48550/arXiv.2507.133534","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2507.133534","arxiv_id":null,"ref_index":32,"raw_excerpt":"Wang, S., Chen, G., Huang, D.a., Li, Z., Li, M., et al.: VideoITG: Multimodal video understanding with instructed temporal grounding (Jul 2025).https://doi.org/ 10.48550/arXiv.2507.133534","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":32,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2507.133534","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"73ee4abcb05279318ebbe6b1924698f658ab8063ecfdebc3d1f381db0e7420dc","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3791,"event_type":"pith.integrity.v1","payload_sha256":"b5c38b7036ada4eae8cdea09e46d74cb5b8d7de0d2e601671ee54216171c45a9","signature_b64":"rZklbLuKKGeLIgoorFLW7GJHjrZUgrNNYcjzWhD0a3Jo9NDT3yTfsbJpHRRQbalLjP66PfLEi90W14gkhH/OCQ==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.073028+00:00","payload":{"note":"Identifier '10.48550/arxiv.2410.032904' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Wang, H., Xu, Z., Cheng, Y., Diao, S., Zhou, Y., et al.: Grounded-VideoLLM: Sharpening fine-grained temporal grounding in video large language models (Aug 2025).https://doi.org/10.48550/arXiv.2410.032904","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2410.032904","arxiv_id":null,"ref_index":31,"raw_excerpt":"Wang, H., Xu, Z., Cheng, Y., Diao, S., Zhou, Y., et al.: Grounded-VideoLLM: Sharpening fine-grained temporal grounding in video large language models (Aug 2025).https://doi.org/10.48550/arXiv.2410.032904","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":31,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2410.032904","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"72b0af9ee08d1acbda4382ddf6ce4ce663d0c8c1809fb16690d489391140edb0","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3790,"event_type":"pith.integrity.v1","payload_sha256":"7237aa6aaf29c2cae7434129dfe6dce4e16f9ef638c23aec5b180db30fe71d7f","signature_b64":"35htSiyS9hJ5ppfw4RdDCnxZJkSNAyA34XdH3AhTQ8rl8NPKQ+PYyPXcy1FlLdJVPwpNQRaB9ERQ+i6lS510Aw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.070168+00:00","payload":{"note":"Identifier '10.48550/arxiv.2512.055134' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Sugandhika, C., Li, C., Rajan, D., Fernando, B.: Know-show: Benchmarking video- language models on spatio-temporal grounded reasoning (Dec 2025).https://doi. org/10.48550/arXiv.2512.055134","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2512.055134","arxiv_id":null,"ref_index":28,"raw_excerpt":"Sugandhika, C., Li, C., Rajan, D., Fernando, B.: Know-show: Benchmarking video- language models on spatio-temporal grounded reasoning (Dec 2025).https://doi. org/10.48550/arXiv.2512.055134","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":28,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2512.055134","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"5b17bb8feecd13e2fc4264fbb4136521c46bca90052a408320aecc65bab55342","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3789,"event_type":"pith.integrity.v1","payload_sha256":"2c43a6ca31e03eb823871d5f862f8e0e3c328f6e5e926a43736bed8e5a369546","signature_b64":"J/W11eAwSNkheqMryBS4sULbH/AL0Y3cmPskOJMMl/MwxBoFqwGqb8/G5R01QvY+LusGjCBre0K59GEiFrI/Bw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.067660+00:00","payload":{"note":"Identifier '10.48550/arxiv.2402.0330013' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Shao, Z., Wang, P., Zhu, Q., Xu, R., Song, J., et al.: DeepSeekMath: Pushing the limits of mathematical reasoning in open language models (Apr 2024).https: //doi.org/10.48550/arXiv.2402.0330013","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2402.0330013","arxiv_id":null,"ref_index":27,"raw_excerpt":"Shao, Z., Wang, P., Zhu, Q., Xu, R., Song, J., et al.: DeepSeekMath: Pushing the limits of mathematical reasoning in open language models (Apr 2024).https: //doi.org/10.48550/arXiv.2402.0330013","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":27,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2402.0330013","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"74291dc5644e9e9009635e02af481524672836559b54bf4628ae209bf57ec614","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3788,"event_type":"pith.integrity.v1","payload_sha256":"94998b6596145680a1c2bba6669eea0ef70596decb126db93daf1aca48d970cf","signature_b64":"XvXrRHqkRmIvs8Y7DTJ5OCsvb+xHTTuH2k/qPpmfSAftOmHA+NlqIqqrTsKvGE3avFrUzVB6RGJOrqBBvMgSDw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.065178+00:00","payload":{"note":"Identifier '10.48550/arxiv.2508.1173712' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Lu, S., Li, Y., Xia, Y., Hu, Y., Zhao, S., et al.: Ovis2.5 technical report (Aug 2025). https://doi.org/10.48550/arXiv.2508.1173712","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2508.1173712","arxiv_id":null,"ref_index":21,"raw_excerpt":"Lu, S., Li, Y., Xia, Y., Hu, Y., Zhao, S., et al.: Ovis2.5 technical report (Aug 2025). https://doi.org/10.48550/arXiv.2508.1173712","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":21,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2508.1173712","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"71839a25e87db2f43b79623843854e43b4153896e071dec37bb3ca04ea4dae57","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3787,"event_type":"pith.integrity.v1","payload_sha256":"3843f81f9d1396597f5d431626f0da94751cb930718896a2693acdcd91b2646d","signature_b64":"vHj3yvwbY67FNU+S7r2Z/6JkPZzw44My2fObn+sWw/pS4oepfZ7Ed3P5NLBUcqHEymnaM0FByh3PfyyvToOeBA==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.062722+00:00","payload":{"note":"Identifier '10.1007/978-3-031-72652-1_64' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Liu, H., Ma, X., Zhong, C., Zhang, Y., Lin, W.: TimeCraft: Navigate weakly- supervised temporal grounded video question answering via bi-directional reason- ing. In: Leonardis, A., Ricci, E., Roth, S., Russakovsky, O., Sattler, T., Varol, G","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.1007/978-3-031-72652-1_64","arxiv_id":null,"ref_index":19,"raw_excerpt":"Liu, H., Ma, X., Zhong, C., Zhang, Y., Lin, W.: TimeCraft: Navigate weakly- supervised temporal grounded video question answering via bi-directional reason- ing. In: Leonardis, A., Ricci, E., Roth, S., Russakovsky, O., Sattler, T., Varol, G. (eds.) Computer Vision – ECCV 2024, vol. 15063. Springer Nature Switzerland, Cham (2025).https://doi.org/10.1007/978-3-031-72652-1_64","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":19,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.1007/978-3-031-72652-1_64","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"d363237e65d0a2917ebfe1a49ca783a3758bdb48e1ab33c402323f206274f5dd","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3786,"event_type":"pith.integrity.v1","payload_sha256":"3205998f83b4356b49758e2b5441fe166a515ebde6e34136bc627bc67ea7d6ea","signature_b64":"YXD8xePOBFl48MN9HzGJLESa6zFz+STAX/B5RpQI0pB3HoPsZ2Uouc+zk5YXMzm8eXopZuiNr8RgVUztApq7BA==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.060072+00:00","payload":{"note":"Identifier '10.1109/iccv51070.2023.012752' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Li, Y., Xiao, J., Feng, C., Wang, X., Chua, T.S.: Discovering spatio-temporal ratio- nales for video question answering. In: 2023 IEEE/CVF International Conference on Computer Vision (ICCV). pp. 13823–13832. IEEE, Paris, France (Oct 2023). ","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.1109/iccv51070.2023.012752","arxiv_id":null,"ref_index":18,"raw_excerpt":"Li, Y., Xiao, J., Feng, C., Wang, X., Chua, T.S.: Discovering spatio-temporal ratio- nales for video question answering. In: 2023 IEEE/CVF International Conference on Computer Vision (ICCV). pp. 13823–13832. IEEE, Paris, France (Oct 2023). https://doi.org/10.1109/ICCV51070.2023.012752","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":18,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.1109/iccv51070.2023.012752","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"cbfca855fdd55eb811187f6b8a83058f00993b362522fcc66aaf22363171c8f7","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3785,"event_type":"pith.integrity.v1","payload_sha256":"ffb138b8374585c6e87364bf7ea30c4b9df595c0686a6df6f14065e3a8695a5b","signature_b64":"lg94ng+F04tRWy2CEcf4bvUMLSYOnNvhWvYE2Ktt8coLSV0cES2objq14h9KlKc2cZOxXjuJ+hW9ignXq6+LBA==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.055554+00:00","payload":{"note":"Identifier '10.48550/arxiv.2501.139194' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Li, R., Wang, X., Zhang, Y., Zohar, O., Wang, Z., et al.: Temporal Preference Optimization for Long-Form Video Understanding (Sep 2025).https://doi.org/ 10.48550/arXiv.2501.139194","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2501.139194","arxiv_id":null,"ref_index":17,"raw_excerpt":"Li, R., Wang, X., Zhang, Y., Zohar, O., Wang, Z., et al.: Temporal Preference Optimization for Long-Form Video Understanding (Sep 2025).https://doi.org/ 10.48550/arXiv.2501.139194","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":17,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2501.139194","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"a7ecf3944c0bb73232ae8eb50a73adde1434a59d0de82a5caab7825ed0635a83","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3784,"event_type":"pith.integrity.v1","payload_sha256":"cd6275a7f8807ee2f732297ea6784b70e3aa88dd8a27af3d7342e8d4399237b9","signature_b64":"vukU1HUfEf/t01SYBZDwShvNiepCp2y33avXRktaSXOFZ3hwcuXGhv1jUqmuUyvkkH6w8IYl08kb6WoD8JiLDQ==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.053245+00:00","payload":{"note":"Identifier '10.48550/arxiv.2401.015057' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Li,H.,Deng,A.,Ke,Q.,Liu,J.,Rahmani,H.,etal.:Sports-QA:Alarge-scalevideo question answering benchmark for complex and professional sports (Jan 2024). https://doi.org/10.48550/arXiv.2401.015057","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2401.015057","arxiv_id":null,"ref_index":16,"raw_excerpt":"Li,H.,Deng,A.,Ke,Q.,Liu,J.,Rahmani,H.,etal.:Sports-QA:Alarge-scalevideo question answering benchmark for complex and professional sports (Jan 2024). https://doi.org/10.48550/arXiv.2401.015057","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":16,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2401.015057","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"0116b1c302f84c9bf16c2bacd85dbeff938f04067aeb69c83c309c945572e180","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3783,"event_type":"pith.integrity.v1","payload_sha256":"f28465e5a6e0bcf0f5c196094d68b92801b817bcb3558d6edd71d4092990ebbb","signature_b64":"D9E02+M38WUozs6leGRgvGz47a2tNwX0afl83W3oTPclfjvKIGRNCCzs3/BWcrvCa/fZEy0IvM7UFPFXkkMWBg==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.050617+00:00","payload":{"note":"Identifier '10.48550/arxiv.2506.094454' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Gupta, A., Roy, A., Chellappa, R., Bastian, N.D., Velasquez, A., et al.: TOGA: Temporally grounded open-ended video QA with weak supervision (Jun 2025). https://doi.org/10.48550/arXiv.2506.094454","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2506.094454","arxiv_id":null,"ref_index":12,"raw_excerpt":"Gupta, A., Roy, A., Chellappa, R., Bastian, N.D., Velasquez, A., et al.: TOGA: Temporally grounded open-ended video QA with weak supervision (Jun 2025). https://doi.org/10.48550/arXiv.2506.094454","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":12,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2506.094454","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"7944f49b7e3a04f5411a9c5f9f445dd6ac86850fa7071dd54dace38e028a0d14","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3782,"event_type":"pith.integrity.v1","payload_sha256":"7c4a38fd4535d29bda2ec706ed226a371dc5ec1fb5419df436a33453bc413616","signature_b64":"/L1mVdPd3WrCbjP7wGZEelXTejD1AEnDxwiQxtyCJcZGG9Obyu7v4oNM0Ly7RXxYyA9IoQOLMJ4YxoVoeCfmCQ==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.047972+00:00","payload":{"note":"Identifier '10.48550/arxiv.2601.106111' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Clark, C., Zhang, J., Ma, Z., Park, J.S., Salehi, M., et al.: Molmo2: Open Weights and Data for Vision-Language Models with Video Understanding and Grounding (Jan 2026).https://doi.org/10.48550/arXiv.2601.106111","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2601.106111","arxiv_id":null,"ref_index":5,"raw_excerpt":"Clark, C., Zhang, J., Ma, Z., Park, J.S., Salehi, M., et al.: Molmo2: Open Weights and Data for Vision-Language Models with Video Understanding and Grounding (Jan 2026).https://doi.org/10.48550/arXiv.2601.106111","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":5,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2601.106111","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"c0ae00a6c5affb09a482337ef459eb00996c240efb98a4a39835705992ab7215","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3781,"event_type":"pith.integrity.v1","payload_sha256":"e7d804349a230b68f00fe07541a648b52513731744922b8648fa8d621c1eadc8","signature_b64":"l4vZCj+EQ1W3OHc+bZAq22RwwjYS9086fMOC4SB89avoS1Jwig3F2rgqLIOyKR8LCP6okWp26tUX79Ol/KZSBw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.045073+00:00","payload":{"note":"Identifier '10.48550/arxiv.2412.0527111' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Chen, Z., Wang, W., Cao, Y., Liu, Y., Gao, Z., et al.: Expanding Performance Boundaries of Open-Source Multimodal Models with Model, Data, and Test-Time Scaling (Sep 2025).https://doi.org/10.48550/arXiv.2412.0527111, 12","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2412.0527111","arxiv_id":null,"ref_index":4,"raw_excerpt":"Chen, Z., Wang, W., Cao, Y., Liu, Y., Gao, Z., et al.: Expanding Performance Boundaries of Open-Source Multimodal Models with Model, Data, and Test-Time Scaling (Sep 2025).https://doi.org/10.48550/arXiv.2412.0527111, 12","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":4,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2412.0527111","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"ee51a61a409e5055063cf87f785b498934828e86cae108b1d28e963a0d4ed319","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3780,"event_type":"pith.integrity.v1","payload_sha256":"d2af6468cf3130936c7b8920d51c0b4af1accd0bac3604c282b05107fe56fb5f","signature_b64":"Oq/i7Ix/aLuwvvFqf78TiPxS2tQ4pfcVETpO+kRRQh0P8dj+N89SV5+xPNBs6IboAtna66lgnMJX5hqyMdgOCQ==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.041734+00:00","payload":{"note":"Identifier '10.48550/arxiv.2412.120752' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Chen, G., Liu, Y., Huang, Y., He, Y., Pei, B., et al.: CG-bench: Clue-grounded question answering benchmark for long video understanding (Dec 2024).https: //doi.org/10.48550/arXiv.2412.120752, 4","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2412.120752","arxiv_id":null,"ref_index":3,"raw_excerpt":"Chen, G., Liu, Y., Huang, Y., He, Y., Pei, B., et al.: CG-bench: Clue-grounded question answering benchmark for long video understanding (Dec 2024).https: //doi.org/10.48550/arXiv.2412.120752, 4","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":3,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2412.120752","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"a33323f48d2835cd84cd2ffa4c4799cac6246a55505983c87a010d344c90c8e0","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3779,"event_type":"pith.integrity.v1","payload_sha256":"04b0fe8f33752e8dc76f862108f5c89bed40c0a9f48aaa1824b1eb08cfa73c7d","signature_b64":"+1laMsiEejauk2GCD7ZMSkMixKntlB3DrAEsZVLNZFuPO9fJv+6uxJ7WjVNCx+KR5ZmdbOurkEZPIBX3HEKsCA==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.035838+00:00","payload":{"note":"Identifier '10.48550/arxiv.2511.216311' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"Bai, S., Cai, Y., Chen, R., Chen, K., Chen, X., et al.: Qwen3-VL technical report (2025).https://doi.org/10.48550/ARXIV.2511.216311, 11","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2511.216311","arxiv_id":null,"ref_index":2,"raw_excerpt":"Bai, S., Cai, Y., Chen, R., Chen, K., Chen, X., et al.: Qwen3-VL technical report (2025).https://doi.org/10.48550/ARXIV.2511.216311, 11","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":2,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2511.216311","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"0294cb3c48c563797484060f753d3624822d7b1b8bea80f26a7f969934b5ea83","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}},{"event_id":3778,"event_type":"pith.integrity.v1","payload_sha256":"92e75b2d3ca87b5b4e203bedfd13cd65da51860f759699268cd1dd48969b6bd9","signature_b64":"J65AGzbhv4KrTXZnMzRKHEQFnBK9y369h05ylgkWnLzuHd8RduyA2CAO10+ZxMjb3lWCocYuBy1IywzZPk1fAw==","signing_key_id":"pith-v1-2026-05","created_at":"2026-05-20T00:17:29.028270+00:00","payload":{"note":"Identifier '10.48550/arxiv.2509.2366112' is syntactically valid but the DOI registry (doi.org) returned 404, and Crossref / OpenAlex / internal corpus also have no record. The cited work could not be located through any authoritative source.","snippet":"An, X., Xie, Y., Yang, K., Zhang, W., Zhao, X., et al.: LLaVA-OneVision-1.5: Fully open framework for democratized multimodal training (Dec 2025).https: //doi.org/10.48550/arXiv.2509.2366112","arxiv_id":"2604.22226","detector":"doi_compliance","evidence":{"doi":"10.48550/arxiv.2509.2366112","arxiv_id":null,"ref_index":1,"raw_excerpt":"An, X., Xie, Y., Yang, K., Zhang, W., Zhao, X., et al.: LLaVA-OneVision-1.5: Fully open framework for democratized multimodal training (Dec 2025).https: //doi.org/10.48550/arXiv.2509.2366112","verdict_class":"cross_source","checked_sources":["crossref_by_doi","openalex_by_doi","doi_org_head"]},"severity":"critical","ref_index":1,"audited_at":"2026-05-20T00:12:39.924367Z","event_type":"pith.integrity.v1","detected_doi":"10.48550/arxiv.2509.2366112","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"unresolvable_identifier","evidence_hash":"c89d755d09b7646b411d158002a8872ea048b091463d5d892c60aa27f96bbabd","paper_version":1,"verdict_class":"cross_source","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null}}],"endpoint_self":"/pith/2604.22226/integrity.json","protocol_url":"https://pith.science/pith-integrity-protocol"}