{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:ORLXT7H7W6HBNYVZWD3VCK3WL5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3fc6e77252e8c131786e8d1a175a575513ca59eb68a77d382d3cc61dea0e5d45","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-03-11T18:13:01Z","title_canon_sha256":"034ac9d1a2343460c80aaeba9b03d0344e1fbfbcb6dbbb390c22a1fd5f9417e5"},"schema_version":"1.0","source":{"id":"1803.04000","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.04000","created_at":"2026-05-18T00:21:33Z"},{"alias_kind":"arxiv_version","alias_value":"1803.04000v1","created_at":"2026-05-18T00:21:33Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.04000","created_at":"2026-05-18T00:21:33Z"},{"alias_kind":"pith_short_12","alias_value":"ORLXT7H7W6HB","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_16","alias_value":"ORLXT7H7W6HBNYVZ","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_8","alias_value":"ORLXT7H7","created_at":"2026-05-18T12:32:43Z"}],"graph_snapshots":[{"event_id":"sha256:ede06b0f481bc94e5d95e289f092429fe4d6eb4fcef00ffb66534bcfa90a8d90","target":"graph","created_at":"2026-05-18T00:21:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Analysis of informative contents and sentiments of social users has been attempted quite intensively in the recent past. Most of the systems are usable only for monolingual data and fails or gives poor results when used on data with code-mixing property. To gather attention and encourage researchers to work on this crisis, we prepared gold standard Bengali-English code-mixed data with language and polarity tag for sentiment analysis purposes. In this paper, we discuss the systems we prepared to collect and filter raw Twitter data. In order to reduce manual work while annotation, hybrid systems","authors_text":"Dipankar Das, Sainik Kumar Mahata, Soumil Mandal","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-03-11T18:13:01Z","title":"Preparing Bengali-English Code-Mixed Corpus for Sentiment Analysis of Indian Languages"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.04000","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4b692fd746f1448d3265ae3bba9bb8a073bb3ca6d2603f73b6527b8afbf555d8","target":"record","created_at":"2026-05-18T00:21:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3fc6e77252e8c131786e8d1a175a575513ca59eb68a77d382d3cc61dea0e5d45","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2018-03-11T18:13:01Z","title_canon_sha256":"034ac9d1a2343460c80aaeba9b03d0344e1fbfbcb6dbbb390c22a1fd5f9417e5"},"schema_version":"1.0","source":{"id":"1803.04000","kind":"arxiv","version":1}},"canonical_sha256":"745779fcffb78e16e2b9b0f7512b765f6e42d33e4635169af3bb34ac2bd265af","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"745779fcffb78e16e2b9b0f7512b765f6e42d33e4635169af3bb34ac2bd265af","first_computed_at":"2026-05-18T00:21:33.223234Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:21:33.223234Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ClgzFfE8ehdop4L1l9JbBo5ECWurPn3qE7qgnJDcbgGaX7xzU6sZ0k4sV8wgSAwxH5Yq8amD3V53yNWzXzwWAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:21:33.223950Z","signed_message":"canonical_sha256_bytes"},"source_id":"1803.04000","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4b692fd746f1448d3265ae3bba9bb8a073bb3ca6d2603f73b6527b8afbf555d8","sha256:ede06b0f481bc94e5d95e289f092429fe4d6eb4fcef00ffb66534bcfa90a8d90"],"state_sha256":"1839efddb4d4e21f74259bdad25924b8e4aca7b437df0674011f834286d5ffe7"}