{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2015:YH2KD5RTUWPESQX7NQUFRID7CD","short_pith_number":"pith:YH2KD5RT","schema_version":"1.0","canonical_sha256":"c1f4a1f633a59e4942ff6c2858a07f10e297b81079722a878b97255bb16c4ba4","source":{"kind":"arxiv","id":"1508.05367","version":2},"attestation_state":"computed","paper":{"title":"Hidden Markov Models for Gene Sequence Classification: Classifying the VSG genes in the Trypanosoma brucei Genome","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CE","cs.LG"],"primary_cat":"q-bio.GN","authors_text":"Andrea Mesa, Fernando Alvarez-Valin, Gustavo Guerberoff, Sebasti\\'an Basterrech","submitted_at":"2015-07-31T14:57:09Z","abstract_excerpt":"The article presents an application of Hidden Markov Models (HMMs) for pattern recognition on genome sequences. We apply HMM for identifying genes encoding the Variant Surface Glycoprotein (VSG) in the genomes of Trypanosoma brucei (T. brucei) and other African trypanosomes. These are parasitic protozoa causative agents of sleeping sickness and several diseases in domestic and wild animals. These parasites have a peculiar strategy to evade the host's immune system that consists in periodically changing their predominant cellular surface protein (VSG). The motivation for using patterns recognit"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1508.05367","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.GN","submitted_at":"2015-07-31T14:57:09Z","cross_cats_sorted":["cs.CE","cs.LG"],"title_canon_sha256":"c18ab5af8a532a7cdf7e2bc61f2a5abb9016aa9cad0c7bae6c7a081856770266","abstract_canon_sha256":"6b4b22b3160ac3f37c71b3066fdada3fd135c10e0a8d1bb92de862c7bf179729"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:29:37.991611Z","signature_b64":"kKW3SyOAs+NNi413hWRaAnQtKGi9swULDIZq5CufFU3tQuCQJ4wMxd1BD4hXJ/eOcdBuFkJsQbH+5UywKzlTAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c1f4a1f633a59e4942ff6c2858a07f10e297b81079722a878b97255bb16c4ba4","last_reissued_at":"2026-05-18T01:29:37.991165Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:29:37.991165Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Hidden Markov Models for Gene Sequence Classification: Classifying the VSG genes in the Trypanosoma brucei Genome","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CE","cs.LG"],"primary_cat":"q-bio.GN","authors_text":"Andrea Mesa, Fernando Alvarez-Valin, Gustavo Guerberoff, Sebasti\\'an Basterrech","submitted_at":"2015-07-31T14:57:09Z","abstract_excerpt":"The article presents an application of Hidden Markov Models (HMMs) for pattern recognition on genome sequences. We apply HMM for identifying genes encoding the Variant Surface Glycoprotein (VSG) in the genomes of Trypanosoma brucei (T. brucei) and other African trypanosomes. These are parasitic protozoa causative agents of sleeping sickness and several diseases in domestic and wild animals. These parasites have a peculiar strategy to evade the host's immune system that consists in periodically changing their predominant cellular surface protein (VSG). The motivation for using patterns recognit"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1508.05367","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1508.05367","created_at":"2026-05-18T01:29:37.991236+00:00"},{"alias_kind":"arxiv_version","alias_value":"1508.05367v2","created_at":"2026-05-18T01:29:37.991236+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1508.05367","created_at":"2026-05-18T01:29:37.991236+00:00"},{"alias_kind":"pith_short_12","alias_value":"YH2KD5RTUWPE","created_at":"2026-05-18T12:29:50.041715+00:00"},{"alias_kind":"pith_short_16","alias_value":"YH2KD5RTUWPESQX7","created_at":"2026-05-18T12:29:50.041715+00:00"},{"alias_kind":"pith_short_8","alias_value":"YH2KD5RT","created_at":"2026-05-18T12:29:50.041715+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/YH2KD5RTUWPESQX7NQUFRID7CD","json":"https://pith.science/pith/YH2KD5RTUWPESQX7NQUFRID7CD.json","graph_json":"https://pith.science/api/pith-number/YH2KD5RTUWPESQX7NQUFRID7CD/graph.json","events_json":"https://pith.science/api/pith-number/YH2KD5RTUWPESQX7NQUFRID7CD/events.json","paper":"https://pith.science/paper/YH2KD5RT"},"agent_actions":{"view_html":"https://pith.science/pith/YH2KD5RTUWPESQX7NQUFRID7CD","download_json":"https://pith.science/pith/YH2KD5RTUWPESQX7NQUFRID7CD.json","view_paper":"https://pith.science/paper/YH2KD5RT","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1508.05367&json=true","fetch_graph":"https://pith.science/api/pith-number/YH2KD5RTUWPESQX7NQUFRID7CD/graph.json","fetch_events":"https://pith.science/api/pith-number/YH2KD5RTUWPESQX7NQUFRID7CD/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/YH2KD5RTUWPESQX7NQUFRID7CD/action/timestamp_anchor","attest_storage":"https://pith.science/pith/YH2KD5RTUWPESQX7NQUFRID7CD/action/storage_attestation","attest_author":"https://pith.science/pith/YH2KD5RTUWPESQX7NQUFRID7CD/action/author_attestation","sign_citation":"https://pith.science/pith/YH2KD5RTUWPESQX7NQUFRID7CD/action/citation_signature","submit_replication":"https://pith.science/pith/YH2KD5RTUWPESQX7NQUFRID7CD/action/replication_record"}},"created_at":"2026-05-18T01:29:37.991236+00:00","updated_at":"2026-05-18T01:29:37.991236+00:00"}