{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2024:EA54DF5YPRNI3UHRFEJWUGWI46","short_pith_number":"pith:EA54DF5Y","canonical_record":{"source":{"id":"2410.15236","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CR","submitted_at":"2024-10-20T00:00:56Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"37db135a3f03533ef0eb26641135e9346b3ead7df6bb07b801f8bbd4c0b4132d","abstract_canon_sha256":"6af61dd759e3ecedb66cdf5c91a433db7f65384effae5562a4e00f436a94d139"},"schema_version":"1.0"},"canonical_sha256":"203bc197b87c5a8dd0f129136a1ac8e79ecd09496d518900247482745ef8c813","source":{"kind":"arxiv","id":"2410.15236","version":4},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2410.15236","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"arxiv_version","alias_value":"2410.15236v4","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2410.15236","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"pith_short_12","alias_value":"EA54DF5YPRNI","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"pith_short_16","alias_value":"EA54DF5YPRNI3UHR","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"pith_short_8","alias_value":"EA54DF5Y","created_at":"2026-05-29T00:04:12Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2024:EA54DF5YPRNI3UHRFEJWUGWI46","target":"record","payload":{"canonical_record":{"source":{"id":"2410.15236","kind":"arxiv","version":4},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CR","submitted_at":"2024-10-20T00:00:56Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"37db135a3f03533ef0eb26641135e9346b3ead7df6bb07b801f8bbd4c0b4132d","abstract_canon_sha256":"6af61dd759e3ecedb66cdf5c91a433db7f65384effae5562a4e00f436a94d139"},"schema_version":"1.0"},"canonical_sha256":"203bc197b87c5a8dd0f129136a1ac8e79ecd09496d518900247482745ef8c813","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-29T00:04:12.336399Z","signature_b64":"GZdotHQLtBeYodjGHeEU7GTBTDIpQi5CxlZZDUjxPMhZBocFEnDrHZaVtupuzlTwRpVkr7QuV6JBSNOVzP5RCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"203bc197b87c5a8dd0f129136a1ac8e79ecd09496d518900247482745ef8c813","last_reissued_at":"2026-05-29T00:04:12.335728Z","signature_status":"signed_v1","first_computed_at":"2026-05-29T00:04:12.335728Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2410.15236","source_version":4,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T00:04:12Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sNIzw+cplemn6iCnIEormsmz04eyjBESW8Qspcqv2ZqmZJmKX5Hp04LyQXbHXBwTtHhi6epE2hxmDpVQ+CQjDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T23:40:45.385073Z"},"content_sha256":"e5bea73129380bba4fdf0e730fd37ee3c506b7141e42c5102230dc8109bc2677","schema_version":"1.0","event_id":"sha256:e5bea73129380bba4fdf0e730fd37ee3c506b7141e42c5102230dc8109bc2677"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2024:EA54DF5YPRNI3UHRFEJWUGWI46","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Jailbreaking and Mitigation of Vulnerabilities in Large Language Models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","cs.LG"],"primary_cat":"cs.CR","authors_text":"Benji Peng, Caitlyn Heqi Yin, Hanxuan Chen, Jiacheng Shi, Keyu Chen, Lawrence K.Q. Yan, Ming Liu, Pohsun Feng, Qian Niu, Riyang Bao, Tianyang Wang, Xinyuan Song, Yichao Zhang, Yizhu Wen, Ziqian Bi","submitted_at":"2024-10-20T00:00:56Z","abstract_excerpt":"Large Language Models (LLMs) have transformed artificial intelligence by advancing natural language understanding and generation, enabling applications across fields beyond healthcare, software engineering, and conversational systems. Despite these advancements in the past few years, LLMs have shown considerable vulnerabilities, particularly to prompt injection and jailbreaking attacks. This review analyzes the state of research on these vulnerabilities and presents available defense strategies. We roughly categorize attack approaches into prompt-based, model-based, multimodal, and multilingua"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2410.15236","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2410.15236/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T00:04:12Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"UMb7736ghQlpznCEekjCUirI+NlAgYtrfDLRUU0z2DDniNcud0+SrVkbu93mWadcn5G8HFskb7/B/oH68GUeCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-29T23:40:45.385814Z"},"content_sha256":"a12025dbcb63a2d1f739d4c56937238d523dc0986f83433dd7f893b499d3d3cd","schema_version":"1.0","event_id":"sha256:a12025dbcb63a2d1f739d4c56937238d523dc0986f83433dd7f893b499d3d3cd"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/EA54DF5YPRNI3UHRFEJWUGWI46/bundle.json","state_url":"https://pith.science/pith/EA54DF5YPRNI3UHRFEJWUGWI46/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/EA54DF5YPRNI3UHRFEJWUGWI46/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-29T23:40:45Z","links":{"resolver":"https://pith.science/pith/EA54DF5YPRNI3UHRFEJWUGWI46","bundle":"https://pith.science/pith/EA54DF5YPRNI3UHRFEJWUGWI46/bundle.json","state":"https://pith.science/pith/EA54DF5YPRNI3UHRFEJWUGWI46/state.json","well_known_bundle":"https://pith.science/.well-known/pith/EA54DF5YPRNI3UHRFEJWUGWI46/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2024:EA54DF5YPRNI3UHRFEJWUGWI46","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"6af61dd759e3ecedb66cdf5c91a433db7f65384effae5562a4e00f436a94d139","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CR","submitted_at":"2024-10-20T00:00:56Z","title_canon_sha256":"37db135a3f03533ef0eb26641135e9346b3ead7df6bb07b801f8bbd4c0b4132d"},"schema_version":"1.0","source":{"id":"2410.15236","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2410.15236","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"arxiv_version","alias_value":"2410.15236v4","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2410.15236","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"pith_short_12","alias_value":"EA54DF5YPRNI","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"pith_short_16","alias_value":"EA54DF5YPRNI3UHR","created_at":"2026-05-29T00:04:12Z"},{"alias_kind":"pith_short_8","alias_value":"EA54DF5Y","created_at":"2026-05-29T00:04:12Z"}],"graph_snapshots":[{"event_id":"sha256:a12025dbcb63a2d1f739d4c56937238d523dc0986f83433dd7f893b499d3d3cd","target":"graph","created_at":"2026-05-29T00:04:12Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2410.15236/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Large Language Models (LLMs) have transformed artificial intelligence by advancing natural language understanding and generation, enabling applications across fields beyond healthcare, software engineering, and conversational systems. Despite these advancements in the past few years, LLMs have shown considerable vulnerabilities, particularly to prompt injection and jailbreaking attacks. This review analyzes the state of research on these vulnerabilities and presents available defense strategies. We roughly categorize attack approaches into prompt-based, model-based, multimodal, and multilingua","authors_text":"Benji Peng, Caitlyn Heqi Yin, Hanxuan Chen, Jiacheng Shi, Keyu Chen, Lawrence K.Q. Yan, Ming Liu, Pohsun Feng, Qian Niu, Riyang Bao, Tianyang Wang, Xinyuan Song, Yichao Zhang, Yizhu Wen, Ziqian Bi","cross_cats":["cs.AI","cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CR","submitted_at":"2024-10-20T00:00:56Z","title":"Jailbreaking and Mitigation of Vulnerabilities in Large Language Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2410.15236","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:e5bea73129380bba4fdf0e730fd37ee3c506b7141e42c5102230dc8109bc2677","target":"record","created_at":"2026-05-29T00:04:12Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"6af61dd759e3ecedb66cdf5c91a433db7f65384effae5562a4e00f436a94d139","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CR","submitted_at":"2024-10-20T00:00:56Z","title_canon_sha256":"37db135a3f03533ef0eb26641135e9346b3ead7df6bb07b801f8bbd4c0b4132d"},"schema_version":"1.0","source":{"id":"2410.15236","kind":"arxiv","version":4}},"canonical_sha256":"203bc197b87c5a8dd0f129136a1ac8e79ecd09496d518900247482745ef8c813","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"203bc197b87c5a8dd0f129136a1ac8e79ecd09496d518900247482745ef8c813","first_computed_at":"2026-05-29T00:04:12.335728Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T00:04:12.335728Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"GZdotHQLtBeYodjGHeEU7GTBTDIpQi5CxlZZDUjxPMhZBocFEnDrHZaVtupuzlTwRpVkr7QuV6JBSNOVzP5RCg==","signature_status":"signed_v1","signed_at":"2026-05-29T00:04:12.336399Z","signed_message":"canonical_sha256_bytes"},"source_id":"2410.15236","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:e5bea73129380bba4fdf0e730fd37ee3c506b7141e42c5102230dc8109bc2677","sha256:a12025dbcb63a2d1f739d4c56937238d523dc0986f83433dd7f893b499d3d3cd"],"state_sha256":"c4ed82b422bfa4e24685fe62d8e2eba2686de1587596d0581c8fd38378d11ff0"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hTDoyb+ReQ+YQACVHHeFHbDk0IH33hQLDv6xl8oXoIfiaziu3eg1rOSGVulISnMf4qJuafVmHVW1HG+ErQVNCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-29T23:40:45.389531Z","bundle_sha256":"fcb0ecf224fea3580dd5b21e7992dff9168e68d29534d24084af33325c8ba4c4"}}