{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2020:IIYGQSUQEORR4ZCQU36RVUA6LW","short_pith_number":"pith:IIYGQSUQ","canonical_record":{"source":{"id":"2004.04270","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-04-08T21:25:00Z","cross_cats_sorted":[],"title_canon_sha256":"faa290e033d5fd4bf3c44b1513c81882a1f5354f654d26ef333735ac86806356","abstract_canon_sha256":"064632c9533a80ee0e31f66652a6df13344fbf2c45f6eb9c370dbefe975d84c3"},"schema_version":"1.0"},"canonical_sha256":"4230684a9023a31e6450a6fd1ad01e5dbcf81cba8562d4302ffdd090658dc97e","source":{"kind":"arxiv","id":"2004.04270","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2004.04270","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"arxiv_version","alias_value":"2004.04270v3","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2004.04270","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"pith_short_12","alias_value":"IIYGQSUQEORR","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"pith_short_16","alias_value":"IIYGQSUQEORR4ZCQ","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"pith_short_8","alias_value":"IIYGQSUQ","created_at":"2026-07-05T01:57:16Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2020:IIYGQSUQEORR4ZCQU36RVUA6LW","target":"record","payload":{"canonical_record":{"source":{"id":"2004.04270","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-04-08T21:25:00Z","cross_cats_sorted":[],"title_canon_sha256":"faa290e033d5fd4bf3c44b1513c81882a1f5354f654d26ef333735ac86806356","abstract_canon_sha256":"064632c9533a80ee0e31f66652a6df13344fbf2c45f6eb9c370dbefe975d84c3"},"schema_version":"1.0"},"canonical_sha256":"4230684a9023a31e6450a6fd1ad01e5dbcf81cba8562d4302ffdd090658dc97e","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T01:57:16.068575Z","signature_b64":"OG1XO3e4GGAKb/5tNsRhUnFxMjkt9PoiCXA87qO7WM3rbN0eQs79zf8OC5Sn/UesDyw848pT0eNBUhjWzETCAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4230684a9023a31e6450a6fd1ad01e5dbcf81cba8562d4302ffdd090658dc97e","last_reissued_at":"2026-07-05T01:57:16.068098Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T01:57:16.068098Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2004.04270","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T01:57:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2rRql7D8C4lIAR5iXluBcfNHn0t06mEHLy+8Nkjr01O1u2dEDR0PlQTKYDXGH9cX/7CPSsSQTu+Vd07UmXtQBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T10:43:12.832269Z"},"content_sha256":"c088c6aff29fe1a0ce49ad80c296a8d8ea205e3ac411192ee5f4f00dbbb066be","schema_version":"1.0","event_id":"sha256:c088c6aff29fe1a0ce49ad80c296a8d8ea205e3ac411192ee5f4f00dbbb066be"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2020:IIYGQSUQEORR4ZCQU36RVUA6LW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"The Spotify Podcast Dataset","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Aasish Pappu, Ann Clifton, Ben Carterette, Jussi Karlgren, Rosie Jones, Sravana Reddy, Yongze Yu","submitted_at":"2020-04-08T21:25:00Z","abstract_excerpt":"Podcasts are a relatively new form of audio media. Episodes appear on a regular cadence, and come in many different formats and levels of formality. They can be formal news journalism or conversational chat; fiction or non-fiction. They are rapidly growing in popularity and yet have been relatively little studied. As an audio format, podcasts are more varied in style and production types than, say, broadcast news, and contain many more genres than typically studied in video research. The medium is therefore a rich domain with many research avenues for the IR and NLP communities. We present the"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2004.04270","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2004.04270/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T01:57:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"DdBp9+NOlv/kx0X4J8qn3Hmc7wAeTn4SYoZq/jidf0/LDDNMql+m+M+rCX2JnEdEcqgSdOlzchFEmPCoVDU3Bg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T10:43:12.832660Z"},"content_sha256":"42fe1e0e835afa5f72dc048cd5c99663e495c171cf3e935b49bf46f38a0680ce","schema_version":"1.0","event_id":"sha256:42fe1e0e835afa5f72dc048cd5c99663e495c171cf3e935b49bf46f38a0680ce"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/IIYGQSUQEORR4ZCQU36RVUA6LW/bundle.json","state_url":"https://pith.science/pith/IIYGQSUQEORR4ZCQU36RVUA6LW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/IIYGQSUQEORR4ZCQU36RVUA6LW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T10:43:12Z","links":{"resolver":"https://pith.science/pith/IIYGQSUQEORR4ZCQU36RVUA6LW","bundle":"https://pith.science/pith/IIYGQSUQEORR4ZCQU36RVUA6LW/bundle.json","state":"https://pith.science/pith/IIYGQSUQEORR4ZCQU36RVUA6LW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/IIYGQSUQEORR4ZCQU36RVUA6LW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2020:IIYGQSUQEORR4ZCQU36RVUA6LW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"064632c9533a80ee0e31f66652a6df13344fbf2c45f6eb9c370dbefe975d84c3","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-04-08T21:25:00Z","title_canon_sha256":"faa290e033d5fd4bf3c44b1513c81882a1f5354f654d26ef333735ac86806356"},"schema_version":"1.0","source":{"id":"2004.04270","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2004.04270","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"arxiv_version","alias_value":"2004.04270v3","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2004.04270","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"pith_short_12","alias_value":"IIYGQSUQEORR","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"pith_short_16","alias_value":"IIYGQSUQEORR4ZCQ","created_at":"2026-07-05T01:57:16Z"},{"alias_kind":"pith_short_8","alias_value":"IIYGQSUQ","created_at":"2026-07-05T01:57:16Z"}],"graph_snapshots":[{"event_id":"sha256:42fe1e0e835afa5f72dc048cd5c99663e495c171cf3e935b49bf46f38a0680ce","target":"graph","created_at":"2026-07-05T01:57:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2004.04270/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Podcasts are a relatively new form of audio media. Episodes appear on a regular cadence, and come in many different formats and levels of formality. They can be formal news journalism or conversational chat; fiction or non-fiction. They are rapidly growing in popularity and yet have been relatively little studied. As an audio format, podcasts are more varied in style and production types than, say, broadcast news, and contain many more genres than typically studied in video research. The medium is therefore a rich domain with many research avenues for the IR and NLP communities. We present the","authors_text":"Aasish Pappu, Ann Clifton, Ben Carterette, Jussi Karlgren, Rosie Jones, Sravana Reddy, Yongze Yu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-04-08T21:25:00Z","title":"The Spotify Podcast Dataset"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2004.04270","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c088c6aff29fe1a0ce49ad80c296a8d8ea205e3ac411192ee5f4f00dbbb066be","target":"record","created_at":"2026-07-05T01:57:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"064632c9533a80ee0e31f66652a6df13344fbf2c45f6eb9c370dbefe975d84c3","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2020-04-08T21:25:00Z","title_canon_sha256":"faa290e033d5fd4bf3c44b1513c81882a1f5354f654d26ef333735ac86806356"},"schema_version":"1.0","source":{"id":"2004.04270","kind":"arxiv","version":3}},"canonical_sha256":"4230684a9023a31e6450a6fd1ad01e5dbcf81cba8562d4302ffdd090658dc97e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4230684a9023a31e6450a6fd1ad01e5dbcf81cba8562d4302ffdd090658dc97e","first_computed_at":"2026-07-05T01:57:16.068098Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T01:57:16.068098Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"OG1XO3e4GGAKb/5tNsRhUnFxMjkt9PoiCXA87qO7WM3rbN0eQs79zf8OC5Sn/UesDyw848pT0eNBUhjWzETCAg==","signature_status":"signed_v1","signed_at":"2026-07-05T01:57:16.068575Z","signed_message":"canonical_sha256_bytes"},"source_id":"2004.04270","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c088c6aff29fe1a0ce49ad80c296a8d8ea205e3ac411192ee5f4f00dbbb066be","sha256:42fe1e0e835afa5f72dc048cd5c99663e495c171cf3e935b49bf46f38a0680ce"],"state_sha256":"686563f5fec59393d9b285cd61c9faeb338fd0df9cd080aedcfe626f101be606"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cDqNY9lDfGZVN6TE84Z3m8i+ABB7HmkEXhyuTcw/2ELGbpN7DLOqy9A8PQA5s2H0/rk0rzcjFz3Z4RqOd4Y6Bg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T10:43:12.834860Z","bundle_sha256":"56936070d755b40cc641972f2a98b13a710c6db62173df58ffdf01984c062915"}}