{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2012:XTX3Y3UEW42YHBB37L6EBF4F3O","short_pith_number":"pith:XTX3Y3UE","schema_version":"1.0","canonical_sha256":"bcefbc6e84b73583843bfafc409785db9fb9b7b89c9e9218aa415f75c373532c","source":{"kind":"arxiv","id":"1203.1878","version":1},"attestation_state":"computed","paper":{"title":"Outlier detection from ETL Execution trace","license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","headline":"","cross_cats":[],"primary_cat":"cs.DB","authors_text":"Amlan Chakrabarti, Samiran Ghosh, Saptarsi Goswami","submitted_at":"2012-03-08T18:30:25Z","abstract_excerpt":"Extract, Transform, Load (ETL) is an integral part of Data Warehousing (DW) implementation. The commercial tools that are used for this purpose captures lot of execution trace in form of various log files with plethora of information. However there has been hardly any initiative where any proactive analyses have been done on the ETL logs to improve their efficiency. In this paper we utilize outlier detection technique to find the processes varying most from the group in terms of execution trace. As our experiment was carried on actual production processes, any outlier we would consider as a si"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1203.1878","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.DB","submitted_at":"2012-03-08T18:30:25Z","cross_cats_sorted":[],"title_canon_sha256":"93540011b9f2196e5038e95773d9d5c30563301b2e01c367fc23f0f825b45483","abstract_canon_sha256":"f2888e82a841ec90bf19f2637d94fe0ab869c6e882f45ecbc19c2288af1ab1fd"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T04:00:36.686570Z","signature_b64":"gsiaTFvIjtLESB+zm9CW8/ajdsVq42NWI2hl4D1GBh9nOra44ih6Kz3n9xlIODfaMkqb/Lxur2Af8/IJ1GsUAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"bcefbc6e84b73583843bfafc409785db9fb9b7b89c9e9218aa415f75c373532c","last_reissued_at":"2026-05-18T04:00:36.686035Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T04:00:36.686035Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Outlier detection from ETL Execution trace","license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","headline":"","cross_cats":[],"primary_cat":"cs.DB","authors_text":"Amlan Chakrabarti, Samiran Ghosh, Saptarsi Goswami","submitted_at":"2012-03-08T18:30:25Z","abstract_excerpt":"Extract, Transform, Load (ETL) is an integral part of Data Warehousing (DW) implementation. The commercial tools that are used for this purpose captures lot of execution trace in form of various log files with plethora of information. However there has been hardly any initiative where any proactive analyses have been done on the ETL logs to improve their efficiency. In this paper we utilize outlier detection technique to find the processes varying most from the group in terms of execution trace. As our experiment was carried on actual production processes, any outlier we would consider as a si"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1203.1878","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1203.1878","created_at":"2026-05-18T04:00:36.686116+00:00"},{"alias_kind":"arxiv_version","alias_value":"1203.1878v1","created_at":"2026-05-18T04:00:36.686116+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1203.1878","created_at":"2026-05-18T04:00:36.686116+00:00"},{"alias_kind":"pith_short_12","alias_value":"XTX3Y3UEW42Y","created_at":"2026-05-18T12:27:27.928770+00:00"},{"alias_kind":"pith_short_16","alias_value":"XTX3Y3UEW42YHBB3","created_at":"2026-05-18T12:27:27.928770+00:00"},{"alias_kind":"pith_short_8","alias_value":"XTX3Y3UE","created_at":"2026-05-18T12:27:27.928770+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/XTX3Y3UEW42YHBB37L6EBF4F3O","json":"https://pith.science/pith/XTX3Y3UEW42YHBB37L6EBF4F3O.json","graph_json":"https://pith.science/api/pith-number/XTX3Y3UEW42YHBB37L6EBF4F3O/graph.json","events_json":"https://pith.science/api/pith-number/XTX3Y3UEW42YHBB37L6EBF4F3O/events.json","paper":"https://pith.science/paper/XTX3Y3UE"},"agent_actions":{"view_html":"https://pith.science/pith/XTX3Y3UEW42YHBB37L6EBF4F3O","download_json":"https://pith.science/pith/XTX3Y3UEW42YHBB37L6EBF4F3O.json","view_paper":"https://pith.science/paper/XTX3Y3UE","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1203.1878&json=true","fetch_graph":"https://pith.science/api/pith-number/XTX3Y3UEW42YHBB37L6EBF4F3O/graph.json","fetch_events":"https://pith.science/api/pith-number/XTX3Y3UEW42YHBB37L6EBF4F3O/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/XTX3Y3UEW42YHBB37L6EBF4F3O/action/timestamp_anchor","attest_storage":"https://pith.science/pith/XTX3Y3UEW42YHBB37L6EBF4F3O/action/storage_attestation","attest_author":"https://pith.science/pith/XTX3Y3UEW42YHBB37L6EBF4F3O/action/author_attestation","sign_citation":"https://pith.science/pith/XTX3Y3UEW42YHBB37L6EBF4F3O/action/citation_signature","submit_replication":"https://pith.science/pith/XTX3Y3UEW42YHBB37L6EBF4F3O/action/replication_record"}},"created_at":"2026-05-18T04:00:36.686116+00:00","updated_at":"2026-05-18T04:00:36.686116+00:00"}