{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:WU3V3EIAQN2LRR6KHOT4QYWVEB","short_pith_number":"pith:WU3V3EIA","canonical_record":{"source":{"id":"2509.21013","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-25T11:20:38Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"17eed0607ab8326aec63de59a64dce691af5fdc12223961037ff4ec6b2d5d1a5","abstract_canon_sha256":"21bc5e0796d01ad7d36bb59c387779a2dd1dbe297bf46da5e5c4ab550acf67ed"},"schema_version":"1.0"},"canonical_sha256":"b5375d91008374b8c7ca3ba7c862d52066b27c54cd32346775958ce5842469f0","source":{"kind":"arxiv","id":"2509.21013","version":4},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2509.21013","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"arxiv_version","alias_value":"2509.21013v4","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2509.21013","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"pith_short_12","alias_value":"WU3V3EIAQN2L","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"pith_short_16","alias_value":"WU3V3EIAQN2LRR6K","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"pith_short_8","alias_value":"WU3V3EIA","created_at":"2026-07-02T00:18:25Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:WU3V3EIAQN2LRR6KHOT4QYWVEB","target":"record","payload":{"canonical_record":{"source":{"id":"2509.21013","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-25T11:20:38Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"17eed0607ab8326aec63de59a64dce691af5fdc12223961037ff4ec6b2d5d1a5","abstract_canon_sha256":"21bc5e0796d01ad7d36bb59c387779a2dd1dbe297bf46da5e5c4ab550acf67ed"},"schema_version":"1.0"},"canonical_sha256":"b5375d91008374b8c7ca3ba7c862d52066b27c54cd32346775958ce5842469f0","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-02T00:18:25.207773Z","signature_b64":"aFAXnHXL0NxnlUZbao4Fdx02fpATCmTr1h7eWs7Xmp6L9T9dikurQzGwrKNTSI8dEcoD2eN7I2hjSwPEwRFeDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b5375d91008374b8c7ca3ba7c862d52066b27c54cd32346775958ce5842469f0","last_reissued_at":"2026-07-02T00:18:25.207198Z","signature_status":"signed_v1","first_computed_at":"2026-07-02T00:18:25.207198Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2509.21013","source_version":4,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-02T00:18:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"MMNxvS6m65e8IzheDYcAElwuxEtun/rNPfmbytngnV9/aNLZSWek3bT049ZwB5Dx4Eba84BVGB9xmkPG20sPAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T21:01:48.816396Z"},"content_sha256":"a970dcbef1c115cb174adafe1cdd88ab006f4a543a2b9fb1c60187b61bcf30a6","schema_version":"1.0","event_id":"sha256:a970dcbef1c115cb174adafe1cdd88ab006f4a543a2b9fb1c60187b61bcf30a6"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:WU3V3EIAQN2LRR6KHOT4QYWVEB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Predicting LLM Reasoning Performance with Small Proxy Model","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Jamin Shin, Juyoung Suk, Se-Young Yun, Sungjun Han, Woosung Koh","submitted_at":"2025-09-25T11:20:38Z","abstract_excerpt":"Given the prohibitive cost of pre-training large language models, it is essential to leverage smaller proxy models to optimize datasets before scaling up. However, this approach becomes challenging for reasoning capabilities, which exhibit emergent behavior that only appear reliably at larger model sizes, often exceeding 7B parameters. To address this, we introduce rBridge, showing that small proxies ($\\leq$1B) can effectively predict large-model reasoning by aligning more closely with (1) the pre-training objective and (2) the target task. rBridge achieves this by weighting negative log-likel"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2509.21013","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2509.21013/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-02T00:18:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"21Y7JZIIGbCZtnB74CsmBcKiQhxSQUX/d/rS8e+w6D9kzzlycNC5+hPL4RyKHUfMx+aMv7iqgxfTAeTXAfyrBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T21:01:48.816772Z"},"content_sha256":"b541b7d0ad74db20e016b78fefaf4d56e887e28ea1e3d3212c1a6a1d7154e9f4","schema_version":"1.0","event_id":"sha256:b541b7d0ad74db20e016b78fefaf4d56e887e28ea1e3d3212c1a6a1d7154e9f4"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/WU3V3EIAQN2LRR6KHOT4QYWVEB/bundle.json","state_url":"https://pith.science/pith/WU3V3EIAQN2LRR6KHOT4QYWVEB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/WU3V3EIAQN2LRR6KHOT4QYWVEB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-02T21:01:48Z","links":{"resolver":"https://pith.science/pith/WU3V3EIAQN2LRR6KHOT4QYWVEB","bundle":"https://pith.science/pith/WU3V3EIAQN2LRR6KHOT4QYWVEB/bundle.json","state":"https://pith.science/pith/WU3V3EIAQN2LRR6KHOT4QYWVEB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/WU3V3EIAQN2LRR6KHOT4QYWVEB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:WU3V3EIAQN2LRR6KHOT4QYWVEB","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"21bc5e0796d01ad7d36bb59c387779a2dd1dbe297bf46da5e5c4ab550acf67ed","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-25T11:20:38Z","title_canon_sha256":"17eed0607ab8326aec63de59a64dce691af5fdc12223961037ff4ec6b2d5d1a5"},"schema_version":"1.0","source":{"id":"2509.21013","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2509.21013","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"arxiv_version","alias_value":"2509.21013v4","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2509.21013","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"pith_short_12","alias_value":"WU3V3EIAQN2L","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"pith_short_16","alias_value":"WU3V3EIAQN2LRR6K","created_at":"2026-07-02T00:18:25Z"},{"alias_kind":"pith_short_8","alias_value":"WU3V3EIA","created_at":"2026-07-02T00:18:25Z"}],"graph_snapshots":[{"event_id":"sha256:b541b7d0ad74db20e016b78fefaf4d56e887e28ea1e3d3212c1a6a1d7154e9f4","target":"graph","created_at":"2026-07-02T00:18:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2509.21013/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Given the prohibitive cost of pre-training large language models, it is essential to leverage smaller proxy models to optimize datasets before scaling up. However, this approach becomes challenging for reasoning capabilities, which exhibit emergent behavior that only appear reliably at larger model sizes, often exceeding 7B parameters. To address this, we introduce rBridge, showing that small proxies ($\\leq$1B) can effectively predict large-model reasoning by aligning more closely with (1) the pre-training objective and (2) the target task. rBridge achieves this by weighting negative log-likel","authors_text":"Jamin Shin, Juyoung Suk, Se-Young Yun, Sungjun Han, Woosung Koh","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-25T11:20:38Z","title":"Predicting LLM Reasoning Performance with Small Proxy Model"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2509.21013","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a970dcbef1c115cb174adafe1cdd88ab006f4a543a2b9fb1c60187b61bcf30a6","target":"record","created_at":"2026-07-02T00:18:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"21bc5e0796d01ad7d36bb59c387779a2dd1dbe297bf46da5e5c4ab550acf67ed","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-09-25T11:20:38Z","title_canon_sha256":"17eed0607ab8326aec63de59a64dce691af5fdc12223961037ff4ec6b2d5d1a5"},"schema_version":"1.0","source":{"id":"2509.21013","kind":"arxiv","version":4}},"canonical_sha256":"b5375d91008374b8c7ca3ba7c862d52066b27c54cd32346775958ce5842469f0","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b5375d91008374b8c7ca3ba7c862d52066b27c54cd32346775958ce5842469f0","first_computed_at":"2026-07-02T00:18:25.207198Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-02T00:18:25.207198Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"aFAXnHXL0NxnlUZbao4Fdx02fpATCmTr1h7eWs7Xmp6L9T9dikurQzGwrKNTSI8dEcoD2eN7I2hjSwPEwRFeDw==","signature_status":"signed_v1","signed_at":"2026-07-02T00:18:25.207773Z","signed_message":"canonical_sha256_bytes"},"source_id":"2509.21013","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a970dcbef1c115cb174adafe1cdd88ab006f4a543a2b9fb1c60187b61bcf30a6","sha256:b541b7d0ad74db20e016b78fefaf4d56e887e28ea1e3d3212c1a6a1d7154e9f4"],"state_sha256":"1ed70f07bc0cf85cb6ed4eb12a95b65734e594881fb5bafca45f63ea76bc063f"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9YsOHjhvAmDclIYxcVdl8m8esCj2HzRa6zDGxbbPp5n2c5WxWV//b4Zos+h40hIbhMzCpJTbirpSJH4Z5zh0Aw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-02T21:01:48.818796Z","bundle_sha256":"de4663a13660bbf563373d0fd97bd2bbb99c5b6f800938d6413181501b94578d"}}