{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:NKOVNBGSHOR2OLJFDZXPQOJJVR","short_pith_number":"pith:NKOVNBGS","canonical_record":{"source":{"id":"1901.11040","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-30T19:00:21Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"0b1826286c7e91f340583514ad33bc88e314b346cd2c0123cb7a09b92c3dbb7e","abstract_canon_sha256":"30c79bdab1a36fd4676f79d1f62bd39b9be9b246e7e5e5857bc8e79eb93882f5"},"schema_version":"1.0"},"canonical_sha256":"6a9d5684d23ba3a72d251e6ef83929ac6c9c0b3c717734c9425f1a4a53721605","source":{"kind":"arxiv","id":"1901.11040","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.11040","created_at":"2026-05-17T23:55:02Z"},{"alias_kind":"arxiv_version","alias_value":"1901.11040v1","created_at":"2026-05-17T23:55:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.11040","created_at":"2026-05-17T23:55:02Z"},{"alias_kind":"pith_short_12","alias_value":"NKOVNBGSHOR2","created_at":"2026-05-18T12:33:24Z"},{"alias_kind":"pith_short_16","alias_value":"NKOVNBGSHOR2OLJF","created_at":"2026-05-18T12:33:24Z"},{"alias_kind":"pith_short_8","alias_value":"NKOVNBGS","created_at":"2026-05-18T12:33:24Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:NKOVNBGSHOR2OLJFDZXPQOJJVR","target":"record","payload":{"canonical_record":{"source":{"id":"1901.11040","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-30T19:00:21Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"0b1826286c7e91f340583514ad33bc88e314b346cd2c0123cb7a09b92c3dbb7e","abstract_canon_sha256":"30c79bdab1a36fd4676f79d1f62bd39b9be9b246e7e5e5857bc8e79eb93882f5"},"schema_version":"1.0"},"canonical_sha256":"6a9d5684d23ba3a72d251e6ef83929ac6c9c0b3c717734c9425f1a4a53721605","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:55:02.780164Z","signature_b64":"2Ij/jstEZrnyDWGh4iU3bcDVv2xBJbDIL/4GmNdbyed9uOFvvtilqksZ9ll0Y6CZXhd/MM32Sbs83mkt/zG2Cw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6a9d5684d23ba3a72d251e6ef83929ac6c9c0b3c717734c9425f1a4a53721605","last_reissued_at":"2026-05-17T23:55:02.779579Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:55:02.779579Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1901.11040","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:55:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"KRPHdlSWHp1tuIsyN1AS3kCDcKLkvU1psOcHsmdHP1JVcLqA67CeRWBW5TrAf/VVW7jOTObGGlKbEMRyKDjCDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T17:30:31.324333Z"},"content_sha256":"32d880be256206af274db563008279a9437ed4ccd7d0b97ac63cce65ed005cbd","schema_version":"1.0","event_id":"sha256:32d880be256206af274db563008279a9437ed4ccd7d0b97ac63cce65ed005cbd"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:NKOVNBGSHOR2OLJFDZXPQOJJVR","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"The Wilderness Area Data Set: Adapting the Covertype data set for unsupervised learning","license":"http://creativecommons.org/publicdomain/zero/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Jakub Zgraja, Richard Hugh Moulton","submitted_at":"2019-01-30T19:00:21Z","abstract_excerpt":"Benchmark data sets are of vital importance in machine learning research, as indicated by the number of repositories that exist to make them publicly available. Although many of these are usable in the stream mining context as well, it is less obvious which data sets can be used to evaluate data stream clustering algorithms. We note that the classic Covertype data set's size makes it attractive for use in stream mining but unfortunately it is specifically designed for classification. Here we detail the process of transforming the Covertype data set into one amenable for unsupervised learning, "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.11040","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:55:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jdrzX4WV3lxJEQPvlbLqOgfvg/gCwHtgfIKvdpfKUMkV0HqQOHAI9xiUWkjYMAfiiMG3f2sJEgRcXJxyyLS2Cw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T17:30:31.324987Z"},"content_sha256":"549b28c717062a5697d56c86f91b76c95fa9d3fffd7fa41847a2d00084661fcd","schema_version":"1.0","event_id":"sha256:549b28c717062a5697d56c86f91b76c95fa9d3fffd7fa41847a2d00084661fcd"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NKOVNBGSHOR2OLJFDZXPQOJJVR/bundle.json","state_url":"https://pith.science/pith/NKOVNBGSHOR2OLJFDZXPQOJJVR/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NKOVNBGSHOR2OLJFDZXPQOJJVR/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T17:30:31Z","links":{"resolver":"https://pith.science/pith/NKOVNBGSHOR2OLJFDZXPQOJJVR","bundle":"https://pith.science/pith/NKOVNBGSHOR2OLJFDZXPQOJJVR/bundle.json","state":"https://pith.science/pith/NKOVNBGSHOR2OLJFDZXPQOJJVR/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NKOVNBGSHOR2OLJFDZXPQOJJVR/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:NKOVNBGSHOR2OLJFDZXPQOJJVR","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"30c79bdab1a36fd4676f79d1f62bd39b9be9b246e7e5e5857bc8e79eb93882f5","cross_cats_sorted":["stat.ML"],"license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-30T19:00:21Z","title_canon_sha256":"0b1826286c7e91f340583514ad33bc88e314b346cd2c0123cb7a09b92c3dbb7e"},"schema_version":"1.0","source":{"id":"1901.11040","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.11040","created_at":"2026-05-17T23:55:02Z"},{"alias_kind":"arxiv_version","alias_value":"1901.11040v1","created_at":"2026-05-17T23:55:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.11040","created_at":"2026-05-17T23:55:02Z"},{"alias_kind":"pith_short_12","alias_value":"NKOVNBGSHOR2","created_at":"2026-05-18T12:33:24Z"},{"alias_kind":"pith_short_16","alias_value":"NKOVNBGSHOR2OLJF","created_at":"2026-05-18T12:33:24Z"},{"alias_kind":"pith_short_8","alias_value":"NKOVNBGS","created_at":"2026-05-18T12:33:24Z"}],"graph_snapshots":[{"event_id":"sha256:549b28c717062a5697d56c86f91b76c95fa9d3fffd7fa41847a2d00084661fcd","target":"graph","created_at":"2026-05-17T23:55:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Benchmark data sets are of vital importance in machine learning research, as indicated by the number of repositories that exist to make them publicly available. Although many of these are usable in the stream mining context as well, it is less obvious which data sets can be used to evaluate data stream clustering algorithms. We note that the classic Covertype data set's size makes it attractive for use in stream mining but unfortunately it is specifically designed for classification. Here we detail the process of transforming the Covertype data set into one amenable for unsupervised learning, ","authors_text":"Jakub Zgraja, Richard Hugh Moulton","cross_cats":["stat.ML"],"headline":"","license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-30T19:00:21Z","title":"The Wilderness Area Data Set: Adapting the Covertype data set for unsupervised learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.11040","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:32d880be256206af274db563008279a9437ed4ccd7d0b97ac63cce65ed005cbd","target":"record","created_at":"2026-05-17T23:55:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"30c79bdab1a36fd4676f79d1f62bd39b9be9b246e7e5e5857bc8e79eb93882f5","cross_cats_sorted":["stat.ML"],"license":"http://creativecommons.org/publicdomain/zero/1.0/","primary_cat":"cs.LG","submitted_at":"2019-01-30T19:00:21Z","title_canon_sha256":"0b1826286c7e91f340583514ad33bc88e314b346cd2c0123cb7a09b92c3dbb7e"},"schema_version":"1.0","source":{"id":"1901.11040","kind":"arxiv","version":1}},"canonical_sha256":"6a9d5684d23ba3a72d251e6ef83929ac6c9c0b3c717734c9425f1a4a53721605","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6a9d5684d23ba3a72d251e6ef83929ac6c9c0b3c717734c9425f1a4a53721605","first_computed_at":"2026-05-17T23:55:02.779579Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:55:02.779579Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"2Ij/jstEZrnyDWGh4iU3bcDVv2xBJbDIL/4GmNdbyed9uOFvvtilqksZ9ll0Y6CZXhd/MM32Sbs83mkt/zG2Cw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:55:02.780164Z","signed_message":"canonical_sha256_bytes"},"source_id":"1901.11040","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:32d880be256206af274db563008279a9437ed4ccd7d0b97ac63cce65ed005cbd","sha256:549b28c717062a5697d56c86f91b76c95fa9d3fffd7fa41847a2d00084661fcd"],"state_sha256":"edc78dd6b3cd6d6e97ae38c5a5c71c0477f590b3f6ca7a7a371725ce7dd330c1"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"NvvrfwT6REreoR1EbCmGHea7shBMC1lbGPTEqy4cITVwtJmmj27rMDC6GWYfNWn7N//rzOR4/YMZSrp1eTWVCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T17:30:31.328379Z","bundle_sha256":"e6fc6bbf1e2de1e3c58d2ae306db3af9016c240c05e6eea21ac006a891feff60"}}