{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:QGF4XNVBTUKF467VNYRLGEYEYR","short_pith_number":"pith:QGF4XNVB","canonical_record":{"source":{"id":"1711.03229","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2017-11-09T01:55:44Z","cross_cats_sorted":["cs.DC"],"title_canon_sha256":"0e79972be5ab65986c67fc2f8717bad5e9a9802e9126730977d39a5e92047024","abstract_canon_sha256":"82385a1b290331c3fa75125b8f5b6fb968dd536ca8b460297cc2ca95c068fd86"},"schema_version":"1.0"},"canonical_sha256":"818bcbb6a19d145e7bf56e22b31304c44ec9aa12956539ec7f4d99b7fd7f5814","source":{"kind":"arxiv","id":"1711.03229","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1711.03229","created_at":"2026-05-18T00:30:56Z"},{"alias_kind":"arxiv_version","alias_value":"1711.03229v1","created_at":"2026-05-18T00:30:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.03229","created_at":"2026-05-18T00:30:56Z"},{"alias_kind":"pith_short_12","alias_value":"QGF4XNVBTUKF","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_16","alias_value":"QGF4XNVBTUKF467V","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_8","alias_value":"QGF4XNVB","created_at":"2026-05-18T12:31:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:QGF4XNVBTUKF467VNYRLGEYEYR","target":"record","payload":{"canonical_record":{"source":{"id":"1711.03229","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2017-11-09T01:55:44Z","cross_cats_sorted":["cs.DC"],"title_canon_sha256":"0e79972be5ab65986c67fc2f8717bad5e9a9802e9126730977d39a5e92047024","abstract_canon_sha256":"82385a1b290331c3fa75125b8f5b6fb968dd536ca8b460297cc2ca95c068fd86"},"schema_version":"1.0"},"canonical_sha256":"818bcbb6a19d145e7bf56e22b31304c44ec9aa12956539ec7f4d99b7fd7f5814","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:30:56.862736Z","signature_b64":"blPaD8h8dK+XKnY8sRyjvlMbyC+BxcnVG/BTyLfgO0mDxYWa+SH+vXtvmi8j5o2ufmj77GN2ALBdZ+XeDIUPCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"818bcbb6a19d145e7bf56e22b31304c44ec9aa12956539ec7f4d99b7fd7f5814","last_reissued_at":"2026-05-18T00:30:56.862119Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:30:56.862119Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1711.03229","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:30:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ThmetzNVcUWIQcPNt6ciacAOTMS4s9Eresi252aUgqqc0ncJuIgVve/AnkZRFxwXz/png/zTrCyUyPpyB8zpCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T20:49:02.886236Z"},"content_sha256":"8a1a79a498f16acb2a9ae1f27e4e35fc65cde02bb3165f8f905762ba30505615","schema_version":"1.0","event_id":"sha256:8a1a79a498f16acb2a9ae1f27e4e35fc65cde02bb3165f8f905762ba30505615"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:QGF4XNVBTUKF467VNYRLGEYEYR","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"A Dwarf-based Scalable Big Data Benchmarking Methodology","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.DC"],"primary_cat":"cs.AR","authors_text":"Biwei Xie, Chen Zheng, Chunjie Luo, Daoyi Zheng, Haibin Wang, Jianfeng Zhan, Lei Wang, Qiang Yang, Wanling Gao, Zhen Jia","submitted_at":"2017-11-09T01:55:44Z","abstract_excerpt":"Different from the traditional benchmarking methodology that creates a new benchmark or proxy for every possible workload, this paper presents a scalable big data benchmarking methodology. Among a wide variety of big data analytics workloads, we identify eight big data dwarfs, each of which captures the common requirements of each class of unit of computation while being reasonably divorced from individual implementations. We implement the eight dwarfs on different software stacks, e.g., OpenMP, MPI, Hadoop as the dwarf components. For the purpose of architecture simulation, we construct and t"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.03229","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:30:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FltRG57nvs3jBDdQVwyLMYvoBOq7hAJnUYevX7ZrIjEXroGyHYUao2qb3Z6SHCnQYvQEL30RkrAZKKnzdczoBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T20:49:02.886965Z"},"content_sha256":"4082dd3fa5546b808badb1f951aa0de8fbee2400ee9c50e206aeab4ffbea9c07","schema_version":"1.0","event_id":"sha256:4082dd3fa5546b808badb1f951aa0de8fbee2400ee9c50e206aeab4ffbea9c07"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/QGF4XNVBTUKF467VNYRLGEYEYR/bundle.json","state_url":"https://pith.science/pith/QGF4XNVBTUKF467VNYRLGEYEYR/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/QGF4XNVBTUKF467VNYRLGEYEYR/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-07T20:49:02Z","links":{"resolver":"https://pith.science/pith/QGF4XNVBTUKF467VNYRLGEYEYR","bundle":"https://pith.science/pith/QGF4XNVBTUKF467VNYRLGEYEYR/bundle.json","state":"https://pith.science/pith/QGF4XNVBTUKF467VNYRLGEYEYR/state.json","well_known_bundle":"https://pith.science/.well-known/pith/QGF4XNVBTUKF467VNYRLGEYEYR/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:QGF4XNVBTUKF467VNYRLGEYEYR","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"82385a1b290331c3fa75125b8f5b6fb968dd536ca8b460297cc2ca95c068fd86","cross_cats_sorted":["cs.DC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2017-11-09T01:55:44Z","title_canon_sha256":"0e79972be5ab65986c67fc2f8717bad5e9a9802e9126730977d39a5e92047024"},"schema_version":"1.0","source":{"id":"1711.03229","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1711.03229","created_at":"2026-05-18T00:30:56Z"},{"alias_kind":"arxiv_version","alias_value":"1711.03229v1","created_at":"2026-05-18T00:30:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.03229","created_at":"2026-05-18T00:30:56Z"},{"alias_kind":"pith_short_12","alias_value":"QGF4XNVBTUKF","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_16","alias_value":"QGF4XNVBTUKF467V","created_at":"2026-05-18T12:31:37Z"},{"alias_kind":"pith_short_8","alias_value":"QGF4XNVB","created_at":"2026-05-18T12:31:37Z"}],"graph_snapshots":[{"event_id":"sha256:4082dd3fa5546b808badb1f951aa0de8fbee2400ee9c50e206aeab4ffbea9c07","target":"graph","created_at":"2026-05-18T00:30:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Different from the traditional benchmarking methodology that creates a new benchmark or proxy for every possible workload, this paper presents a scalable big data benchmarking methodology. Among a wide variety of big data analytics workloads, we identify eight big data dwarfs, each of which captures the common requirements of each class of unit of computation while being reasonably divorced from individual implementations. We implement the eight dwarfs on different software stacks, e.g., OpenMP, MPI, Hadoop as the dwarf components. For the purpose of architecture simulation, we construct and t","authors_text":"Biwei Xie, Chen Zheng, Chunjie Luo, Daoyi Zheng, Haibin Wang, Jianfeng Zhan, Lei Wang, Qiang Yang, Wanling Gao, Zhen Jia","cross_cats":["cs.DC"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2017-11-09T01:55:44Z","title":"A Dwarf-based Scalable Big Data Benchmarking Methodology"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.03229","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8a1a79a498f16acb2a9ae1f27e4e35fc65cde02bb3165f8f905762ba30505615","target":"record","created_at":"2026-05-18T00:30:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"82385a1b290331c3fa75125b8f5b6fb968dd536ca8b460297cc2ca95c068fd86","cross_cats_sorted":["cs.DC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AR","submitted_at":"2017-11-09T01:55:44Z","title_canon_sha256":"0e79972be5ab65986c67fc2f8717bad5e9a9802e9126730977d39a5e92047024"},"schema_version":"1.0","source":{"id":"1711.03229","kind":"arxiv","version":1}},"canonical_sha256":"818bcbb6a19d145e7bf56e22b31304c44ec9aa12956539ec7f4d99b7fd7f5814","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"818bcbb6a19d145e7bf56e22b31304c44ec9aa12956539ec7f4d99b7fd7f5814","first_computed_at":"2026-05-18T00:30:56.862119Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:30:56.862119Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"blPaD8h8dK+XKnY8sRyjvlMbyC+BxcnVG/BTyLfgO0mDxYWa+SH+vXtvmi8j5o2ufmj77GN2ALBdZ+XeDIUPCQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:30:56.862736Z","signed_message":"canonical_sha256_bytes"},"source_id":"1711.03229","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8a1a79a498f16acb2a9ae1f27e4e35fc65cde02bb3165f8f905762ba30505615","sha256:4082dd3fa5546b808badb1f951aa0de8fbee2400ee9c50e206aeab4ffbea9c07"],"state_sha256":"e528b5668d9d94c0843998336963686fc0c9d768387dfec1e480350de8a4c0be"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jxEB6pQNArsV0UFI/8h+ajBLdqEOxToRKqefpzT9CN5tZxmmdMnyaTlls3Dshz28N0hgsO0FbfCWD/R5chxLBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-07T20:49:02.890539Z","bundle_sha256":"b35448340ffae3689944ba4ad3eb3e11748b0727b8dd34f819e4377058a219fc"}}