{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:4XX643Z55LEQTHJPTOQ2QXFZ2E","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"9ce6bfcb1226afa0d45668fdb5bff3b4bec593147320427a57f9abb7d90f6663","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2017-01-05T14:14:52Z","title_canon_sha256":"88c927bd8383fa79eca5f99de120bd33191e10ddd692bf9d0a7555e002fdf941"},"schema_version":"1.0","source":{"id":"1701.01325","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1701.01325","created_at":"2026-05-18T00:53:19Z"},{"alias_kind":"arxiv_version","alias_value":"1701.01325v1","created_at":"2026-05-18T00:53:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1701.01325","created_at":"2026-05-18T00:53:19Z"},{"alias_kind":"pith_short_12","alias_value":"4XX643Z55LEQ","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_16","alias_value":"4XX643Z55LEQTHJP","created_at":"2026-05-18T12:31:00Z"},{"alias_kind":"pith_short_8","alias_value":"4XX643Z5","created_at":"2026-05-18T12:31:00Z"}],"graph_snapshots":[{"event_id":"sha256:ba6b3f1e9a8c085e5224a479ad351196e8984005f669fefafb9a7631010ca4ec","target":"graph","created_at":"2026-05-18T00:53:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The problem of outlier detection is extremely challenging in many domains such as text, in which the attribute values are typically non-negative, and most values are zero. In such cases, it often becomes difficult to separate the outliers from the natural variations in the patterns in the underlying data. In this paper, we present a matrix factorization method, which is naturally able to distinguish the anomalies with the use of low rank approximations of the underlying data. Our iterative algorithm TONMF is based on block coordinate descent (BCD) framework. We define blocks over the term-docu","authors_text":"Charu C. Aggarwal, Haesun Park, Hyenkyun Woo, Ramakrishnan Kannan","cross_cats":["cs.LG","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2017-01-05T14:14:52Z","title":"Outlier Detection for Text Data : An Extended Version"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1701.01325","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:133025be55fa3800dc7eac7c8571b4a3925fd66718242bfc7340ab4befa9a395","target":"record","created_at":"2026-05-18T00:53:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"9ce6bfcb1226afa0d45668fdb5bff3b4bec593147320427a57f9abb7d90f6663","cross_cats_sorted":["cs.LG","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2017-01-05T14:14:52Z","title_canon_sha256":"88c927bd8383fa79eca5f99de120bd33191e10ddd692bf9d0a7555e002fdf941"},"schema_version":"1.0","source":{"id":"1701.01325","kind":"arxiv","version":1}},"canonical_sha256":"e5efee6f3deac9099d2f9ba1a85cb9d132c74015dda3259aaef7c8cff758f2f5","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e5efee6f3deac9099d2f9ba1a85cb9d132c74015dda3259aaef7c8cff758f2f5","first_computed_at":"2026-05-18T00:53:19.901759Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:53:19.901759Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"VHuHst0uS5QihCl16vVUXnBBpwGfMF/2z4rX2yTaQid66N8z9mQvEITd5KwEHgsXqav34bJAYVk21nSFX94vAw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:53:19.902168Z","signed_message":"canonical_sha256_bytes"},"source_id":"1701.01325","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:133025be55fa3800dc7eac7c8571b4a3925fd66718242bfc7340ab4befa9a395","sha256:ba6b3f1e9a8c085e5224a479ad351196e8984005f669fefafb9a7631010ca4ec"],"state_sha256":"1bcdd25081945bae7a9519e5659d1847ab594a0b901a5c7dd83359b9a5c1cd5e"}