{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:R4WNXXNG3SJBDPMMBSAF3SI2N4","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"592169d42d57f67f5a6d76ca87df63e690ff3ede6689e76fe62f1c8a6601d97e","cross_cats_sorted":["cs.AI","cs.CL","cs.IR"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2016-08-29T18:45:00Z","title_canon_sha256":"f711a78f5acb74f316f7aa0ce5f7f4a26cb6b75a24e49770d5c35d7f125d15e4"},"schema_version":"1.0","source":{"id":"1608.08176","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1608.08176","created_at":"2026-05-18T00:20:57Z"},{"alias_kind":"arxiv_version","alias_value":"1608.08176v4","created_at":"2026-05-18T00:20:57Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1608.08176","created_at":"2026-05-18T00:20:57Z"},{"alias_kind":"pith_short_12","alias_value":"R4WNXXNG3SJB","created_at":"2026-05-18T12:30:41Z"},{"alias_kind":"pith_short_16","alias_value":"R4WNXXNG3SJBDPMM","created_at":"2026-05-18T12:30:41Z"},{"alias_kind":"pith_short_8","alias_value":"R4WNXXNG","created_at":"2026-05-18T12:30:41Z"}],"graph_snapshots":[{"event_id":"sha256:fa20064e41d0d79407030caa6e25a792d988f8fee478e73020c4cd5a976fe226","target":"graph","created_at":"2026-05-18T00:20:57Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Context: Topic modeling finds human-readable structures in unstructured textual data. A widely used topic modeler is Latent Dirichlet allocation. When run on different datasets, LDA suffers from \"order effects\" i.e. different topics are generated if the order of training data is shuffled. Such order effects introduce a systematic error for any study. This error can relate to misleading results;specifically, inaccurate topic descriptions and a reduction in the efficacy of text mining classification results. Objective: To provide a method in which distributions generated by LDA are more stable a","authors_text":"Amritanshu Agrawal, Tim Menzies, Wei Fu","cross_cats":["cs.AI","cs.CL","cs.IR"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2016-08-29T18:45:00Z","title":"What is Wrong with Topic Modeling? (and How to Fix it Using Search-based Software Engineering)"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1608.08176","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:98bdb68a1b153ad25f9e54ef299053c159b07c336c8f051da2d5a4056d23d832","target":"record","created_at":"2026-05-18T00:20:57Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"592169d42d57f67f5a6d76ca87df63e690ff3ede6689e76fe62f1c8a6601d97e","cross_cats_sorted":["cs.AI","cs.CL","cs.IR"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2016-08-29T18:45:00Z","title_canon_sha256":"f711a78f5acb74f316f7aa0ce5f7f4a26cb6b75a24e49770d5c35d7f125d15e4"},"schema_version":"1.0","source":{"id":"1608.08176","kind":"arxiv","version":4}},"canonical_sha256":"8f2cdbdda6dc9211bd8c0c805dc91a6f18cd98e2cd6f6aa4dd11f892ee791ce5","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8f2cdbdda6dc9211bd8c0c805dc91a6f18cd98e2cd6f6aa4dd11f892ee791ce5","first_computed_at":"2026-05-18T00:20:57.282437Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:20:57.282437Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ENdy7+zRE0fm8gNGT/BH8HZlws7B9gubSyOoXS2pcZe2qME35oGfMOGL1WHusPnG6lAW8jNWX+dEmBfReGMEDg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:20:57.283098Z","signed_message":"canonical_sha256_bytes"},"source_id":"1608.08176","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:98bdb68a1b153ad25f9e54ef299053c159b07c336c8f051da2d5a4056d23d832","sha256:fa20064e41d0d79407030caa6e25a792d988f8fee478e73020c4cd5a976fe226"],"state_sha256":"08907e59ad2b1a9413cacc3e9e2e895228194d8d95114dadb98f3529e7bbd508"}