{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:XGAGX6ALLNDR3VI7B6WH3IZ534","short_pith_number":"pith:XGAGX6AL","schema_version":"1.0","canonical_sha256":"b9806bf80b5b471dd51f0fac7da33ddf2f9c8c3ec58b0eb50654d709bc9e7b4e","source":{"kind":"arxiv","id":"2607.01751","version":1},"attestation_state":"computed","paper":{"title":"MedStreamBench: A Time-Aware Benchmark for Streaming and Proactive Medical Video Understanding","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CV","authors_text":"Shujian Gao, Songtao Jiang, Yuan Wang, Zhengyu Hu, Zuozhu Liu","submitted_at":"2026-07-02T06:07:44Z","abstract_excerpt":"Existing medical video benchmarks primarily evaluate whether a model produces the correct answer, but rarely assess whether it answers at the right time. In real clinical settings, AI systems must decide not only what to predict, but also when to answer, defer judgment, or proactively raise alerts. This creates a critical gap between benchmark evaluation and deployment requirements. We present MedStreamBench, a benchmark for time-aware medical video understanding. MedStreamBench integrates 22 medical datasets and 5,419 QA instances across four temporal settings: retrospective, present, future,"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2607.01751","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-07-02T06:07:44Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"8dc3a9db204cf31c5ab1ab7929c49b6971b0cb55c60db86837ede4dfc74fc6aa","abstract_canon_sha256":"57bb897c31af3d3d96c474fb39ddcae601c40108dc55f86f71f666c02174e4bd"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-03T01:17:28.488024Z","signature_b64":"mNE04qY2NKmwUg3c4nKC7/i12CYwAtzWxQ5PyWKr9L3EK+Ba4WDWkdeAVW/a0Ogvvo4X40ib23GgyfC0xqgEDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b9806bf80b5b471dd51f0fac7da33ddf2f9c8c3ec58b0eb50654d709bc9e7b4e","last_reissued_at":"2026-07-03T01:17:28.487625Z","signature_status":"signed_v1","first_computed_at":"2026-07-03T01:17:28.487625Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"MedStreamBench: A Time-Aware Benchmark for Streaming and Proactive Medical Video Understanding","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CV","authors_text":"Shujian Gao, Songtao Jiang, Yuan Wang, Zhengyu Hu, Zuozhu Liu","submitted_at":"2026-07-02T06:07:44Z","abstract_excerpt":"Existing medical video benchmarks primarily evaluate whether a model produces the correct answer, but rarely assess whether it answers at the right time. In real clinical settings, AI systems must decide not only what to predict, but also when to answer, defer judgment, or proactively raise alerts. This creates a critical gap between benchmark evaluation and deployment requirements. We present MedStreamBench, a benchmark for time-aware medical video understanding. MedStreamBench integrates 22 medical datasets and 5,419 QA instances across four temporal settings: retrospective, present, future,"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2607.01751","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2607.01751/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2607.01751","created_at":"2026-07-03T01:17:28.487688+00:00"},{"alias_kind":"arxiv_version","alias_value":"2607.01751v1","created_at":"2026-07-03T01:17:28.487688+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2607.01751","created_at":"2026-07-03T01:17:28.487688+00:00"},{"alias_kind":"pith_short_12","alias_value":"XGAGX6ALLNDR","created_at":"2026-07-03T01:17:28.487688+00:00"},{"alias_kind":"pith_short_16","alias_value":"XGAGX6ALLNDR3VI7","created_at":"2026-07-03T01:17:28.487688+00:00"},{"alias_kind":"pith_short_8","alias_value":"XGAGX6AL","created_at":"2026-07-03T01:17:28.487688+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/XGAGX6ALLNDR3VI7B6WH3IZ534","json":"https://pith.science/pith/XGAGX6ALLNDR3VI7B6WH3IZ534.json","graph_json":"https://pith.science/api/pith-number/XGAGX6ALLNDR3VI7B6WH3IZ534/graph.json","events_json":"https://pith.science/api/pith-number/XGAGX6ALLNDR3VI7B6WH3IZ534/events.json","paper":"https://pith.science/paper/XGAGX6AL"},"agent_actions":{"view_html":"https://pith.science/pith/XGAGX6ALLNDR3VI7B6WH3IZ534","download_json":"https://pith.science/pith/XGAGX6ALLNDR3VI7B6WH3IZ534.json","view_paper":"https://pith.science/paper/XGAGX6AL","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2607.01751&json=true","fetch_graph":"https://pith.science/api/pith-number/XGAGX6ALLNDR3VI7B6WH3IZ534/graph.json","fetch_events":"https://pith.science/api/pith-number/XGAGX6ALLNDR3VI7B6WH3IZ534/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/XGAGX6ALLNDR3VI7B6WH3IZ534/action/timestamp_anchor","attest_storage":"https://pith.science/pith/XGAGX6ALLNDR3VI7B6WH3IZ534/action/storage_attestation","attest_author":"https://pith.science/pith/XGAGX6ALLNDR3VI7B6WH3IZ534/action/author_attestation","sign_citation":"https://pith.science/pith/XGAGX6ALLNDR3VI7B6WH3IZ534/action/citation_signature","submit_replication":"https://pith.science/pith/XGAGX6ALLNDR3VI7B6WH3IZ534/action/replication_record"}},"created_at":"2026-07-03T01:17:28.487688+00:00","updated_at":"2026-07-03T01:17:28.487688+00:00"}