{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2024:GPAQLZJYYEKLHJSTWHRXGDCTGT","short_pith_number":"pith:GPAQLZJY","canonical_record":{"source":{"id":"2409.12589","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"hep-ph","submitted_at":"2024-09-19T09:12:29Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"dfae844f67bc4659456a47c7dfcfab59915c9b08fd00805273e5041eaf5c06ed","abstract_canon_sha256":"68cdc2e84a3820c14ba54db8cd90c419bf6d2f03e52f474e3e7514ae615678ac"},"schema_version":"1.0"},"canonical_sha256":"33c105e538c114b3a653b1e3730c5334f378e4e4e795a93fa9f7e13ec117ae84","source":{"kind":"arxiv","id":"2409.12589","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2409.12589","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"arxiv_version","alias_value":"2409.12589v2","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2409.12589","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"pith_short_12","alias_value":"GPAQLZJYYEKL","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"pith_short_16","alias_value":"GPAQLZJYYEKLHJST","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"pith_short_8","alias_value":"GPAQLZJY","created_at":"2026-07-05T09:13:56Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2024:GPAQLZJYYEKLHJSTWHRXGDCTGT","target":"record","payload":{"canonical_record":{"source":{"id":"2409.12589","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"hep-ph","submitted_at":"2024-09-19T09:12:29Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"dfae844f67bc4659456a47c7dfcfab59915c9b08fd00805273e5041eaf5c06ed","abstract_canon_sha256":"68cdc2e84a3820c14ba54db8cd90c419bf6d2f03e52f474e3e7514ae615678ac"},"schema_version":"1.0"},"canonical_sha256":"33c105e538c114b3a653b1e3730c5334f378e4e4e795a93fa9f7e13ec117ae84","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T09:13:56.985894Z","signature_b64":"Ic1WP/g2u+mUowS/L745Q+WNhtNv3oHc6XU+ZW/SK5im9+CxxQ8jaWCglAt7iPYZFq4XCuNMY/O04FLWSc/RCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"33c105e538c114b3a653b1e3730c5334f378e4e4e795a93fa9f7e13ec117ae84","last_reissued_at":"2026-07-05T09:13:56.985348Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T09:13:56.985348Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2409.12589","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T09:13:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RhW6v4bAg83ld4AgVngMmJa1wRHQhjvzthr9JOWMGt5/Me/guL/pt5cG1T0gEwAbZaYN+TzCOtmLQJGMSzmuCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T15:55:02.483033Z"},"content_sha256":"e00e0f857d9e2d7aa34340b9f30a2309b3862e8a9884e9d8e521941673386872","schema_version":"1.0","event_id":"sha256:e00e0f857d9e2d7aa34340b9f30a2309b3862e8a9884e9d8e521941673386872"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2024:GPAQLZJYYEKLHJSTWHRXGDCTGT","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Is Tokenization Needed for Masked Particle Modelling?","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"hep-ph","authors_text":"Fran\\c{c}ois Charton, In\\^es Ochoa, Lukas Heinrich, Margarita Osadchy, Matthew Leigh, Michael Kagan, Samuel Klein, Tobias Golling","submitted_at":"2024-09-19T09:12:29Z","abstract_excerpt":"In this work, we significantly enhance masked particle modeling (MPM), a self-supervised learning scheme for constructing highly expressive representations of unordered sets relevant to developing foundation models for high-energy physics. In MPM, a model is trained to recover the missing elements of a set, a learning objective that requires no labels and can be applied directly to experimental data. We achieve significant performance improvements over previous work on MPM by addressing inefficiencies in the implementation and incorporating a more powerful decoder. We compare several pre-train"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2409.12589","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2409.12589/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T09:13:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JzV0M/MK53C5kJIkmNKNRHc/GUzEEbs60A70Bl34NrceVCVTtcJWL3E0OxMfYHKut7IeifC7wwwLk5gU+vy6Cw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T15:55:02.483699Z"},"content_sha256":"3f8d3263dbd6c2700ae941e2379b04287d09b3a319539a76f69fa77b00bb295f","schema_version":"1.0","event_id":"sha256:3f8d3263dbd6c2700ae941e2379b04287d09b3a319539a76f69fa77b00bb295f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/GPAQLZJYYEKLHJSTWHRXGDCTGT/bundle.json","state_url":"https://pith.science/pith/GPAQLZJYYEKLHJSTWHRXGDCTGT/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/GPAQLZJYYEKLHJSTWHRXGDCTGT/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T15:55:02Z","links":{"resolver":"https://pith.science/pith/GPAQLZJYYEKLHJSTWHRXGDCTGT","bundle":"https://pith.science/pith/GPAQLZJYYEKLHJSTWHRXGDCTGT/bundle.json","state":"https://pith.science/pith/GPAQLZJYYEKLHJSTWHRXGDCTGT/state.json","well_known_bundle":"https://pith.science/.well-known/pith/GPAQLZJYYEKLHJSTWHRXGDCTGT/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2024:GPAQLZJYYEKLHJSTWHRXGDCTGT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"68cdc2e84a3820c14ba54db8cd90c419bf6d2f03e52f474e3e7514ae615678ac","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"hep-ph","submitted_at":"2024-09-19T09:12:29Z","title_canon_sha256":"dfae844f67bc4659456a47c7dfcfab59915c9b08fd00805273e5041eaf5c06ed"},"schema_version":"1.0","source":{"id":"2409.12589","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2409.12589","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"arxiv_version","alias_value":"2409.12589v2","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2409.12589","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"pith_short_12","alias_value":"GPAQLZJYYEKL","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"pith_short_16","alias_value":"GPAQLZJYYEKLHJST","created_at":"2026-07-05T09:13:56Z"},{"alias_kind":"pith_short_8","alias_value":"GPAQLZJY","created_at":"2026-07-05T09:13:56Z"}],"graph_snapshots":[{"event_id":"sha256:3f8d3263dbd6c2700ae941e2379b04287d09b3a319539a76f69fa77b00bb295f","target":"graph","created_at":"2026-07-05T09:13:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2409.12589/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"In this work, we significantly enhance masked particle modeling (MPM), a self-supervised learning scheme for constructing highly expressive representations of unordered sets relevant to developing foundation models for high-energy physics. In MPM, a model is trained to recover the missing elements of a set, a learning objective that requires no labels and can be applied directly to experimental data. We achieve significant performance improvements over previous work on MPM by addressing inefficiencies in the implementation and incorporating a more powerful decoder. We compare several pre-train","authors_text":"Fran\\c{c}ois Charton, In\\^es Ochoa, Lukas Heinrich, Margarita Osadchy, Matthew Leigh, Michael Kagan, Samuel Klein, Tobias Golling","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"hep-ph","submitted_at":"2024-09-19T09:12:29Z","title":"Is Tokenization Needed for Masked Particle Modelling?"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2409.12589","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e00e0f857d9e2d7aa34340b9f30a2309b3862e8a9884e9d8e521941673386872","target":"record","created_at":"2026-07-05T09:13:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"68cdc2e84a3820c14ba54db8cd90c419bf6d2f03e52f474e3e7514ae615678ac","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"hep-ph","submitted_at":"2024-09-19T09:12:29Z","title_canon_sha256":"dfae844f67bc4659456a47c7dfcfab59915c9b08fd00805273e5041eaf5c06ed"},"schema_version":"1.0","source":{"id":"2409.12589","kind":"arxiv","version":2}},"canonical_sha256":"33c105e538c114b3a653b1e3730c5334f378e4e4e795a93fa9f7e13ec117ae84","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"33c105e538c114b3a653b1e3730c5334f378e4e4e795a93fa9f7e13ec117ae84","first_computed_at":"2026-07-05T09:13:56.985348Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T09:13:56.985348Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Ic1WP/g2u+mUowS/L745Q+WNhtNv3oHc6XU+ZW/SK5im9+CxxQ8jaWCglAt7iPYZFq4XCuNMY/O04FLWSc/RCQ==","signature_status":"signed_v1","signed_at":"2026-07-05T09:13:56.985894Z","signed_message":"canonical_sha256_bytes"},"source_id":"2409.12589","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e00e0f857d9e2d7aa34340b9f30a2309b3862e8a9884e9d8e521941673386872","sha256:3f8d3263dbd6c2700ae941e2379b04287d09b3a319539a76f69fa77b00bb295f"],"state_sha256":"1ad4eae978781d2ba13d780aed802406bf6f26903db3d1d92caa56f741afe994"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"7CtJRDCPviBBfdiX0UWyGHPGuS/ov0DoulJ2wOMa69BaC4Wh8SLwD0hybnQSW07w9e9XVZlxC6jICAFSO0P/Bg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T15:55:02.487406Z","bundle_sha256":"633f109087fa391ffb3327f7abd2a29035a09ce2d9b949d67c9a8622d65bf84a"}}