{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:BWHEO4NBDKOHSW3HZH6PEHS2S2","short_pith_number":"pith:BWHEO4NB","canonical_record":{"source":{"id":"1707.05261","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-17T16:12:34Z","cross_cats_sorted":[],"title_canon_sha256":"766e756cc80095166aea982153f7227374059f72cfe3f81ed0d34099f2b5241f","abstract_canon_sha256":"35db84b032c9595311484eb310ec43b0adee607b5163e2967a84894b8bfd9611"},"schema_version":"1.0"},"canonical_sha256":"0d8e4771a11a9c795b67c9fcf21e5a96b2fee90a7c701e6ca87cefe41f01d023","source":{"kind":"arxiv","id":"1707.05261","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1707.05261","created_at":"2026-05-18T00:40:09Z"},{"alias_kind":"arxiv_version","alias_value":"1707.05261v1","created_at":"2026-05-18T00:40:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1707.05261","created_at":"2026-05-18T00:40:09Z"},{"alias_kind":"pith_short_12","alias_value":"BWHEO4NBDKOH","created_at":"2026-05-18T12:31:08Z"},{"alias_kind":"pith_short_16","alias_value":"BWHEO4NBDKOHSW3H","created_at":"2026-05-18T12:31:08Z"},{"alias_kind":"pith_short_8","alias_value":"BWHEO4NB","created_at":"2026-05-18T12:31:08Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:BWHEO4NBDKOHSW3HZH6PEHS2S2","target":"record","payload":{"canonical_record":{"source":{"id":"1707.05261","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-17T16:12:34Z","cross_cats_sorted":[],"title_canon_sha256":"766e756cc80095166aea982153f7227374059f72cfe3f81ed0d34099f2b5241f","abstract_canon_sha256":"35db84b032c9595311484eb310ec43b0adee607b5163e2967a84894b8bfd9611"},"schema_version":"1.0"},"canonical_sha256":"0d8e4771a11a9c795b67c9fcf21e5a96b2fee90a7c701e6ca87cefe41f01d023","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:40:09.054345Z","signature_b64":"TCcuyFTKVIJJ59it51k/fAy8Ccc81CTjpR0vU6Xq6nrFV0OJ3C7GUu4fgwA7CdbTm7t+AnYpZmokchjqB9bCAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0d8e4771a11a9c795b67c9fcf21e5a96b2fee90a7c701e6ca87cefe41f01d023","last_reissued_at":"2026-05-18T00:40:09.053872Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:40:09.053872Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1707.05261","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:40:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"pxy4qKlyynddiJdq/KqXQi6gV10J3C4G/pUcqE0LIhECNnvnL+5AJEPLLaacV2mMXJ1kX7fi9fKWIpgMibbDBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T11:22:51.033901Z"},"content_sha256":"57200f1a4427b6d9ebc5805b44185aac94115128098f48ade5b27e50ef4078d6","schema_version":"1.0","event_id":"sha256:57200f1a4427b6d9ebc5805b44185aac94115128098f48ade5b27e50ef4078d6"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:BWHEO4NBDKOHSW3HZH6PEHS2S2","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Exploring text datasets by visualizing relevant words","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Franziska Horn, Gr\\'egoire Montavon, Klaus-Robert M\\\"uller, Leila Arras, Wojciech Samek","submitted_at":"2017-07-17T16:12:34Z","abstract_excerpt":"When working with a new dataset, it is important to first explore and familiarize oneself with it, before applying any advanced machine learning algorithms. However, to the best of our knowledge, no tools exist that quickly and reliably give insight into the contents of a selection of documents with respect to what distinguishes them from other documents belonging to different categories. In this paper we propose to extract `relevant words' from a collection of texts, which summarize the contents of documents belonging to a certain class (or discovered cluster in the case of unlabeled datasets"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1707.05261","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:40:09Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6aCOE6maffZuNh01XRo7gcYkEbbgyKXgaxiDOj4LVc3M3x7s7cwHRzLk5LKSwWukaWZ45QJ9kIj4IbHjmONYDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T11:22:51.034246Z"},"content_sha256":"f47c015bab51e5a5dfcdc300eb010c0dc5b40ec4741cac0819155f0642649a99","schema_version":"1.0","event_id":"sha256:f47c015bab51e5a5dfcdc300eb010c0dc5b40ec4741cac0819155f0642649a99"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/BWHEO4NBDKOHSW3HZH6PEHS2S2/bundle.json","state_url":"https://pith.science/pith/BWHEO4NBDKOHSW3HZH6PEHS2S2/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/BWHEO4NBDKOHSW3HZH6PEHS2S2/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T11:22:51Z","links":{"resolver":"https://pith.science/pith/BWHEO4NBDKOHSW3HZH6PEHS2S2","bundle":"https://pith.science/pith/BWHEO4NBDKOHSW3HZH6PEHS2S2/bundle.json","state":"https://pith.science/pith/BWHEO4NBDKOHSW3HZH6PEHS2S2/state.json","well_known_bundle":"https://pith.science/.well-known/pith/BWHEO4NBDKOHSW3HZH6PEHS2S2/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:BWHEO4NBDKOHSW3HZH6PEHS2S2","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"35db84b032c9595311484eb310ec43b0adee607b5163e2967a84894b8bfd9611","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-17T16:12:34Z","title_canon_sha256":"766e756cc80095166aea982153f7227374059f72cfe3f81ed0d34099f2b5241f"},"schema_version":"1.0","source":{"id":"1707.05261","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1707.05261","created_at":"2026-05-18T00:40:09Z"},{"alias_kind":"arxiv_version","alias_value":"1707.05261v1","created_at":"2026-05-18T00:40:09Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1707.05261","created_at":"2026-05-18T00:40:09Z"},{"alias_kind":"pith_short_12","alias_value":"BWHEO4NBDKOH","created_at":"2026-05-18T12:31:08Z"},{"alias_kind":"pith_short_16","alias_value":"BWHEO4NBDKOHSW3H","created_at":"2026-05-18T12:31:08Z"},{"alias_kind":"pith_short_8","alias_value":"BWHEO4NB","created_at":"2026-05-18T12:31:08Z"}],"graph_snapshots":[{"event_id":"sha256:f47c015bab51e5a5dfcdc300eb010c0dc5b40ec4741cac0819155f0642649a99","target":"graph","created_at":"2026-05-18T00:40:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"When working with a new dataset, it is important to first explore and familiarize oneself with it, before applying any advanced machine learning algorithms. However, to the best of our knowledge, no tools exist that quickly and reliably give insight into the contents of a selection of documents with respect to what distinguishes them from other documents belonging to different categories. In this paper we propose to extract `relevant words' from a collection of texts, which summarize the contents of documents belonging to a certain class (or discovered cluster in the case of unlabeled datasets","authors_text":"Franziska Horn, Gr\\'egoire Montavon, Klaus-Robert M\\\"uller, Leila Arras, Wojciech Samek","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-17T16:12:34Z","title":"Exploring text datasets by visualizing relevant words"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1707.05261","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:57200f1a4427b6d9ebc5805b44185aac94115128098f48ade5b27e50ef4078d6","target":"record","created_at":"2026-05-18T00:40:09Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"35db84b032c9595311484eb310ec43b0adee607b5163e2967a84894b8bfd9611","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-07-17T16:12:34Z","title_canon_sha256":"766e756cc80095166aea982153f7227374059f72cfe3f81ed0d34099f2b5241f"},"schema_version":"1.0","source":{"id":"1707.05261","kind":"arxiv","version":1}},"canonical_sha256":"0d8e4771a11a9c795b67c9fcf21e5a96b2fee90a7c701e6ca87cefe41f01d023","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"0d8e4771a11a9c795b67c9fcf21e5a96b2fee90a7c701e6ca87cefe41f01d023","first_computed_at":"2026-05-18T00:40:09.053872Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:40:09.053872Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"TCcuyFTKVIJJ59it51k/fAy8Ccc81CTjpR0vU6Xq6nrFV0OJ3C7GUu4fgwA7CdbTm7t+AnYpZmokchjqB9bCAw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:40:09.054345Z","signed_message":"canonical_sha256_bytes"},"source_id":"1707.05261","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:57200f1a4427b6d9ebc5805b44185aac94115128098f48ade5b27e50ef4078d6","sha256:f47c015bab51e5a5dfcdc300eb010c0dc5b40ec4741cac0819155f0642649a99"],"state_sha256":"110aefa51f3e919246cbac5e0cf92d0ecc9c4476eb2b6b1fd641ceb2f4d2ea3e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1T+RFgKfPRTtlAzwnX5y8Skm3yrGJd4jaFjULCytVh8RhsrLEOE1S4YyUZIc5qQ3ns9v8geVwXa2pl65ZZtyCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T11:22:51.036208Z","bundle_sha256":"7c8d7bc48ed2d748aceb4cc1cd54ecd9b2f9a50d45c847ded4754070969fb214"}}