{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:ME4U54ZQ4LU7TZIQVB45HZKRTD","short_pith_number":"pith:ME4U54ZQ","canonical_record":{"source":{"id":"1901.06328","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2019-01-18T16:32:11Z","cross_cats_sorted":["q-bio.QM","stat.ML"],"title_canon_sha256":"168269a3515195c767c58d88f74c5f7c4083bc8e821b9d23a461305997bbe764","abstract_canon_sha256":"618a2ec2a28ffcbb51e2f20b9d30914430a406d59014d86ebb4c714b7eb68f72"},"schema_version":"1.0"},"canonical_sha256":"61394ef330e2e9f9e510a879d3e55198de2cfaa05272705f5cd4d33bc61e4eb2","source":{"kind":"arxiv","id":"1901.06328","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.06328","created_at":"2026-05-17T23:56:01Z"},{"alias_kind":"arxiv_version","alias_value":"1901.06328v1","created_at":"2026-05-17T23:56:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.06328","created_at":"2026-05-17T23:56:01Z"},{"alias_kind":"pith_short_12","alias_value":"ME4U54ZQ4LU7","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_16","alias_value":"ME4U54ZQ4LU7TZIQ","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_8","alias_value":"ME4U54ZQ","created_at":"2026-05-18T12:33:21Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:ME4U54ZQ4LU7TZIQVB45HZKRTD","target":"record","payload":{"canonical_record":{"source":{"id":"1901.06328","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2019-01-18T16:32:11Z","cross_cats_sorted":["q-bio.QM","stat.ML"],"title_canon_sha256":"168269a3515195c767c58d88f74c5f7c4083bc8e821b9d23a461305997bbe764","abstract_canon_sha256":"618a2ec2a28ffcbb51e2f20b9d30914430a406d59014d86ebb4c714b7eb68f72"},"schema_version":"1.0"},"canonical_sha256":"61394ef330e2e9f9e510a879d3e55198de2cfaa05272705f5cd4d33bc61e4eb2","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:56:01.367893Z","signature_b64":"diyy+5Zcs41tuf3HSuasgDplwq4O24Trz5MFEYYCa+zxHgfFXYlHYy55xjEtw2lG2y4dIh5Xqa63tjXAqUJaDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"61394ef330e2e9f9e510a879d3e55198de2cfaa05272705f5cd4d33bc61e4eb2","last_reissued_at":"2026-05-17T23:56:01.366891Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:56:01.366891Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1901.06328","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"c3RH7B/L1aLyU/VjFqTloFSrVDvfEmbGFNnfWg8gpd2aqw2AKX/Kzuy2VcVliYMutcMM8yOd3+xPRzlG9BAWDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T07:35:59.737670Z"},"content_sha256":"73c50ce508b1a90c338c799dc9c3044bd3772746ce82417ce838f2f8693a0ad7","schema_version":"1.0","event_id":"sha256:73c50ce508b1a90c338c799dc9c3044bd3772746ce82417ce838f2f8693a0ad7"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:ME4U54ZQ4LU7TZIQVB45HZKRTD","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Estimating the effective dimension of large biological datasets using Fisher separability analysis","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["q-bio.QM","stat.ML"],"primary_cat":"cs.LG","authors_text":"Andrei Zinovyev, Jonathan Bac, Luca Albergante","submitted_at":"2019-01-18T16:32:11Z","abstract_excerpt":"Modern large-scale datasets are frequently said to be high-dimensional. However, their data point clouds frequently possess structures, significantly decreasing their intrinsic dimensionality (ID) due to the presence of clusters, points being located close to low-dimensional varieties or fine-grained lumping. We test a recently introduced dimensionality estimator, based on analysing the separability properties of data points, on several benchmarks and real biological datasets. We show that the introduced measure of ID has performance competitive with state-of-the-art measures, being efficient "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.06328","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:56:01Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"s+8FJkjfaGuy5SzpXsDqjMygEh2gJeVUYC5KRjxpGw1TaRUROlfwPSHkB9gt9/sWYLL/XTSBS1q84j8vcnJPDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T07:35:59.738293Z"},"content_sha256":"b4f025d9c09cd501093a69bb1ec29695402c58e307e451c33b13e5213b6702d2","schema_version":"1.0","event_id":"sha256:b4f025d9c09cd501093a69bb1ec29695402c58e307e451c33b13e5213b6702d2"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ME4U54ZQ4LU7TZIQVB45HZKRTD/bundle.json","state_url":"https://pith.science/pith/ME4U54ZQ4LU7TZIQVB45HZKRTD/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ME4U54ZQ4LU7TZIQVB45HZKRTD/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T07:35:59Z","links":{"resolver":"https://pith.science/pith/ME4U54ZQ4LU7TZIQVB45HZKRTD","bundle":"https://pith.science/pith/ME4U54ZQ4LU7TZIQVB45HZKRTD/bundle.json","state":"https://pith.science/pith/ME4U54ZQ4LU7TZIQVB45HZKRTD/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ME4U54ZQ4LU7TZIQVB45HZKRTD/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:ME4U54ZQ4LU7TZIQVB45HZKRTD","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"618a2ec2a28ffcbb51e2f20b9d30914430a406d59014d86ebb4c714b7eb68f72","cross_cats_sorted":["q-bio.QM","stat.ML"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2019-01-18T16:32:11Z","title_canon_sha256":"168269a3515195c767c58d88f74c5f7c4083bc8e821b9d23a461305997bbe764"},"schema_version":"1.0","source":{"id":"1901.06328","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1901.06328","created_at":"2026-05-17T23:56:01Z"},{"alias_kind":"arxiv_version","alias_value":"1901.06328v1","created_at":"2026-05-17T23:56:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1901.06328","created_at":"2026-05-17T23:56:01Z"},{"alias_kind":"pith_short_12","alias_value":"ME4U54ZQ4LU7","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_16","alias_value":"ME4U54ZQ4LU7TZIQ","created_at":"2026-05-18T12:33:21Z"},{"alias_kind":"pith_short_8","alias_value":"ME4U54ZQ","created_at":"2026-05-18T12:33:21Z"}],"graph_snapshots":[{"event_id":"sha256:b4f025d9c09cd501093a69bb1ec29695402c58e307e451c33b13e5213b6702d2","target":"graph","created_at":"2026-05-17T23:56:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Modern large-scale datasets are frequently said to be high-dimensional. However, their data point clouds frequently possess structures, significantly decreasing their intrinsic dimensionality (ID) due to the presence of clusters, points being located close to low-dimensional varieties or fine-grained lumping. We test a recently introduced dimensionality estimator, based on analysing the separability properties of data points, on several benchmarks and real biological datasets. We show that the introduced measure of ID has performance competitive with state-of-the-art measures, being efficient ","authors_text":"Andrei Zinovyev, Jonathan Bac, Luca Albergante","cross_cats":["q-bio.QM","stat.ML"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2019-01-18T16:32:11Z","title":"Estimating the effective dimension of large biological datasets using Fisher separability analysis"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1901.06328","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:73c50ce508b1a90c338c799dc9c3044bd3772746ce82417ce838f2f8693a0ad7","target":"record","created_at":"2026-05-17T23:56:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"618a2ec2a28ffcbb51e2f20b9d30914430a406d59014d86ebb4c714b7eb68f72","cross_cats_sorted":["q-bio.QM","stat.ML"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2019-01-18T16:32:11Z","title_canon_sha256":"168269a3515195c767c58d88f74c5f7c4083bc8e821b9d23a461305997bbe764"},"schema_version":"1.0","source":{"id":"1901.06328","kind":"arxiv","version":1}},"canonical_sha256":"61394ef330e2e9f9e510a879d3e55198de2cfaa05272705f5cd4d33bc61e4eb2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"61394ef330e2e9f9e510a879d3e55198de2cfaa05272705f5cd4d33bc61e4eb2","first_computed_at":"2026-05-17T23:56:01.366891Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:56:01.366891Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"diyy+5Zcs41tuf3HSuasgDplwq4O24Trz5MFEYYCa+zxHgfFXYlHYy55xjEtw2lG2y4dIh5Xqa63tjXAqUJaDA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:56:01.367893Z","signed_message":"canonical_sha256_bytes"},"source_id":"1901.06328","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:73c50ce508b1a90c338c799dc9c3044bd3772746ce82417ce838f2f8693a0ad7","sha256:b4f025d9c09cd501093a69bb1ec29695402c58e307e451c33b13e5213b6702d2"],"state_sha256":"2f9bd723ca21300e5d613c430491bedf42df2d25887f98abcd17f470b6f1c76c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"AF9uLl/g1i4S1X6ti5nONMZE5xMvyYKSctVqURVoejV+vI4/oLwBxFopg+l3yBSsKnY+KLleSQKSrtsDrmNZCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T07:35:59.741801Z","bundle_sha256":"684862bdfd0d85ff432f09546c6cb1cf2a7968215de7adc7a16a32ac44155c11"}}