{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2014:KMIE6XY57MICXMUUEGXKW4XIF7","short_pith_number":"pith:KMIE6XY5","schema_version":"1.0","canonical_sha256":"53104f5f1dfb102bb29421aeab72e82fc1ad92ed238b0429cc1b430f2bce8103","source":{"kind":"arxiv","id":"1401.0355","version":2},"attestation_state":"computed","paper":{"title":"Improving the Load Balance of MapReduce Operations based on the Key Distribution of Pairs","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DC","authors_text":"Bo Gao, Fa Zhang, Liya Fan, Xi Sun, Zhiyong Liu","submitted_at":"2014-01-02T01:42:23Z","abstract_excerpt":"Load balance is important for MapReduce to reduce job duration, increase parallel efficiency, etc. Previous work focuses on coarse-grained scheduling. This study concerns fine-grained scheduling on MapReduce operations. Each operation represents one invocation of the Map or Reduce function. Scheduling MapReduce operations is difficult due to highly screwed operation loads, no support to collect workload statistics, and high complexity of the scheduling problem. So current implementations adopt simple strategies, leading to poor load balance. To address these difficulties, we design an algorith"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1401.0355","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.DC","submitted_at":"2014-01-02T01:42:23Z","cross_cats_sorted":[],"title_canon_sha256":"ae98810abd1c4794fc1b0c9b124647ca4c4395ffe04ad6aec8764a68aed17674","abstract_canon_sha256":"a98b85810be61670c1c32a6f13125ae125ee6e13cab780912528285c0d19eb2b"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:54:20.980949Z","signature_b64":"B0gCiZz5KxWMauk2ZzKG/2gtu8Ra0P7XKsFeVkKZubdU3eT4IrAmNumqN1aZrHvEIkdIMCwXa4xsHfZ0CuLgDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"53104f5f1dfb102bb29421aeab72e82fc1ad92ed238b0429cc1b430f2bce8103","last_reissued_at":"2026-05-18T02:54:20.980526Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:54:20.980526Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Improving the Load Balance of MapReduce Operations based on the Key Distribution of Pairs","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.DC","authors_text":"Bo Gao, Fa Zhang, Liya Fan, Xi Sun, Zhiyong Liu","submitted_at":"2014-01-02T01:42:23Z","abstract_excerpt":"Load balance is important for MapReduce to reduce job duration, increase parallel efficiency, etc. Previous work focuses on coarse-grained scheduling. This study concerns fine-grained scheduling on MapReduce operations. Each operation represents one invocation of the Map or Reduce function. Scheduling MapReduce operations is difficult due to highly screwed operation loads, no support to collect workload statistics, and high complexity of the scheduling problem. So current implementations adopt simple strategies, leading to poor load balance. To address these difficulties, we design an algorith"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1401.0355","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1401.0355","created_at":"2026-05-18T02:54:20.980591+00:00"},{"alias_kind":"arxiv_version","alias_value":"1401.0355v2","created_at":"2026-05-18T02:54:20.980591+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1401.0355","created_at":"2026-05-18T02:54:20.980591+00:00"},{"alias_kind":"pith_short_12","alias_value":"KMIE6XY57MIC","created_at":"2026-05-18T12:28:35.611951+00:00"},{"alias_kind":"pith_short_16","alias_value":"KMIE6XY57MICXMUU","created_at":"2026-05-18T12:28:35.611951+00:00"},{"alias_kind":"pith_short_8","alias_value":"KMIE6XY5","created_at":"2026-05-18T12:28:35.611951+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/KMIE6XY57MICXMUUEGXKW4XIF7","json":"https://pith.science/pith/KMIE6XY57MICXMUUEGXKW4XIF7.json","graph_json":"https://pith.science/api/pith-number/KMIE6XY57MICXMUUEGXKW4XIF7/graph.json","events_json":"https://pith.science/api/pith-number/KMIE6XY57MICXMUUEGXKW4XIF7/events.json","paper":"https://pith.science/paper/KMIE6XY5"},"agent_actions":{"view_html":"https://pith.science/pith/KMIE6XY57MICXMUUEGXKW4XIF7","download_json":"https://pith.science/pith/KMIE6XY57MICXMUUEGXKW4XIF7.json","view_paper":"https://pith.science/paper/KMIE6XY5","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1401.0355&json=true","fetch_graph":"https://pith.science/api/pith-number/KMIE6XY57MICXMUUEGXKW4XIF7/graph.json","fetch_events":"https://pith.science/api/pith-number/KMIE6XY57MICXMUUEGXKW4XIF7/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/KMIE6XY57MICXMUUEGXKW4XIF7/action/timestamp_anchor","attest_storage":"https://pith.science/pith/KMIE6XY57MICXMUUEGXKW4XIF7/action/storage_attestation","attest_author":"https://pith.science/pith/KMIE6XY57MICXMUUEGXKW4XIF7/action/author_attestation","sign_citation":"https://pith.science/pith/KMIE6XY57MICXMUUEGXKW4XIF7/action/citation_signature","submit_replication":"https://pith.science/pith/KMIE6XY57MICXMUUEGXKW4XIF7/action/replication_record"}},"created_at":"2026-05-18T02:54:20.980591+00:00","updated_at":"2026-05-18T02:54:20.980591+00:00"}