{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:DBG7USJ4IIW7B2HNXIXOIYFSQZ","short_pith_number":"pith:DBG7USJ4","canonical_record":{"source":{"id":"1805.03647","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2018-05-09T15:10:57Z","cross_cats_sorted":["cs.LG","eess.AS","stat.ML"],"title_canon_sha256":"b2ce2c96910fb1b7947896d41514584a200645c19b905bcb352080ac1907c9c4","abstract_canon_sha256":"b49e207a065b268eb0fea1d821c1cf53ce701cf74a9fb41634efe82a8746894d"},"schema_version":"1.0"},"canonical_sha256":"184dfa493c422df0e8edba2ee460b286718e9e285179514c33dae8196e1a5abd","source":{"kind":"arxiv","id":"1805.03647","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.03647","created_at":"2026-05-18T00:16:19Z"},{"alias_kind":"arxiv_version","alias_value":"1805.03647v1","created_at":"2026-05-18T00:16:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.03647","created_at":"2026-05-18T00:16:19Z"},{"alias_kind":"pith_short_12","alias_value":"DBG7USJ4IIW7","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_16","alias_value":"DBG7USJ4IIW7B2HN","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_8","alias_value":"DBG7USJ4","created_at":"2026-05-18T12:32:19Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:DBG7USJ4IIW7B2HNXIXOIYFSQZ","target":"record","payload":{"canonical_record":{"source":{"id":"1805.03647","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2018-05-09T15:10:57Z","cross_cats_sorted":["cs.LG","eess.AS","stat.ML"],"title_canon_sha256":"b2ce2c96910fb1b7947896d41514584a200645c19b905bcb352080ac1907c9c4","abstract_canon_sha256":"b49e207a065b268eb0fea1d821c1cf53ce701cf74a9fb41634efe82a8746894d"},"schema_version":"1.0"},"canonical_sha256":"184dfa493c422df0e8edba2ee460b286718e9e285179514c33dae8196e1a5abd","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:16:19.042011Z","signature_b64":"OVFjvUrTricgz+ofgPn3M1bcJd+EFzzIUqL1iF5Q3GnSlIGfuHzCUoTtVhc/wxNsrEdAQC8PHKSqLcEi/c5pAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"184dfa493c422df0e8edba2ee460b286718e9e285179514c33dae8196e1a5abd","last_reissued_at":"2026-05-18T00:16:19.041476Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:16:19.041476Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1805.03647","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:16:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Pc53ss7fU/eeaeJ5hvb0SwuHNmPRJlAbsxH7lmxFm29FD+BLxBg/JNTQP84r9KVh1YwspD0k9lBN8girTyC0DA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T02:17:49.860866Z"},"content_sha256":"f845f98709d8280b1998970277b9fce592b813081229785eae371642678b0900","schema_version":"1.0","event_id":"sha256:f845f98709d8280b1998970277b9fce592b813081229785eae371642678b0900"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:DBG7USJ4IIW7B2HNXIXOIYFSQZ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"End-to-End Polyphonic Sound Event Detection Using Convolutional Recurrent Neural Networks with Learned Time-Frequency Representation Input","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","eess.AS","stat.ML"],"primary_cat":"cs.SD","authors_text":"Emre \\c{C}ak{\\i}r, Tuomas Virtanen","submitted_at":"2018-05-09T15:10:57Z","abstract_excerpt":"Sound event detection systems typically consist of two stages: extracting hand-crafted features from the raw audio waveform, and learning a mapping between these features and the target sound events using a classifier. Recently, the focus of sound event detection research has been mostly shifted to the latter stage using standard features such as mel spectrogram as the input for classifiers such as deep neural networks. In this work, we utilize end-to-end approach and propose to combine these two stages in a single deep neural network classifier. The feature extraction over the raw waveform is"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.03647","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:16:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"w2o/YeK+D177w13Vkf371WFeXHkkfdbLy6rtWZnprr+Oa1Dfvl+CY2R7w1Wgyf2Ty3GASjAuSJiNhYq4+YNoBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T02:17:49.861613Z"},"content_sha256":"8e90e267fb7f0ca40b4dcb787a5cd18475f074b0fbf2a6dca6e10b6f19085cd3","schema_version":"1.0","event_id":"sha256:8e90e267fb7f0ca40b4dcb787a5cd18475f074b0fbf2a6dca6e10b6f19085cd3"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/DBG7USJ4IIW7B2HNXIXOIYFSQZ/bundle.json","state_url":"https://pith.science/pith/DBG7USJ4IIW7B2HNXIXOIYFSQZ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/DBG7USJ4IIW7B2HNXIXOIYFSQZ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T02:17:49Z","links":{"resolver":"https://pith.science/pith/DBG7USJ4IIW7B2HNXIXOIYFSQZ","bundle":"https://pith.science/pith/DBG7USJ4IIW7B2HNXIXOIYFSQZ/bundle.json","state":"https://pith.science/pith/DBG7USJ4IIW7B2HNXIXOIYFSQZ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/DBG7USJ4IIW7B2HNXIXOIYFSQZ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:DBG7USJ4IIW7B2HNXIXOIYFSQZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b49e207a065b268eb0fea1d821c1cf53ce701cf74a9fb41634efe82a8746894d","cross_cats_sorted":["cs.LG","eess.AS","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2018-05-09T15:10:57Z","title_canon_sha256":"b2ce2c96910fb1b7947896d41514584a200645c19b905bcb352080ac1907c9c4"},"schema_version":"1.0","source":{"id":"1805.03647","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.03647","created_at":"2026-05-18T00:16:19Z"},{"alias_kind":"arxiv_version","alias_value":"1805.03647v1","created_at":"2026-05-18T00:16:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.03647","created_at":"2026-05-18T00:16:19Z"},{"alias_kind":"pith_short_12","alias_value":"DBG7USJ4IIW7","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_16","alias_value":"DBG7USJ4IIW7B2HN","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_8","alias_value":"DBG7USJ4","created_at":"2026-05-18T12:32:19Z"}],"graph_snapshots":[{"event_id":"sha256:8e90e267fb7f0ca40b4dcb787a5cd18475f074b0fbf2a6dca6e10b6f19085cd3","target":"graph","created_at":"2026-05-18T00:16:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Sound event detection systems typically consist of two stages: extracting hand-crafted features from the raw audio waveform, and learning a mapping between these features and the target sound events using a classifier. Recently, the focus of sound event detection research has been mostly shifted to the latter stage using standard features such as mel spectrogram as the input for classifiers such as deep neural networks. In this work, we utilize end-to-end approach and propose to combine these two stages in a single deep neural network classifier. The feature extraction over the raw waveform is","authors_text":"Emre \\c{C}ak{\\i}r, Tuomas Virtanen","cross_cats":["cs.LG","eess.AS","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2018-05-09T15:10:57Z","title":"End-to-End Polyphonic Sound Event Detection Using Convolutional Recurrent Neural Networks with Learned Time-Frequency Representation Input"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.03647","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f845f98709d8280b1998970277b9fce592b813081229785eae371642678b0900","target":"record","created_at":"2026-05-18T00:16:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b49e207a065b268eb0fea1d821c1cf53ce701cf74a9fb41634efe82a8746894d","cross_cats_sorted":["cs.LG","eess.AS","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SD","submitted_at":"2018-05-09T15:10:57Z","title_canon_sha256":"b2ce2c96910fb1b7947896d41514584a200645c19b905bcb352080ac1907c9c4"},"schema_version":"1.0","source":{"id":"1805.03647","kind":"arxiv","version":1}},"canonical_sha256":"184dfa493c422df0e8edba2ee460b286718e9e285179514c33dae8196e1a5abd","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"184dfa493c422df0e8edba2ee460b286718e9e285179514c33dae8196e1a5abd","first_computed_at":"2026-05-18T00:16:19.041476Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:16:19.041476Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"OVFjvUrTricgz+ofgPn3M1bcJd+EFzzIUqL1iF5Q3GnSlIGfuHzCUoTtVhc/wxNsrEdAQC8PHKSqLcEi/c5pAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:16:19.042011Z","signed_message":"canonical_sha256_bytes"},"source_id":"1805.03647","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f845f98709d8280b1998970277b9fce592b813081229785eae371642678b0900","sha256:8e90e267fb7f0ca40b4dcb787a5cd18475f074b0fbf2a6dca6e10b6f19085cd3"],"state_sha256":"b5bcd2ba6aa4cecf7b5e80336c8d6392ca1df8c893141bfa779ccba501ee96da"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/ZAwR82yBwjQMaeSEB2VXPglZZoeWB0zH68A5RzKibliPy1Kyi7ZRKkUctvM5dpZlhcoh6kEUNGobU1cZVU5BA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T02:17:49.865597Z","bundle_sha256":"705971d0e351cbb8d678a05a995856f6e678d91ad7046b3eaa99ec925c248fc6"}}