{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2017:IDS6QE63U3PK7XBWKZIS4IRV7I","short_pith_number":"pith:IDS6QE63","schema_version":"1.0","canonical_sha256":"40e5e813dba6deafdc3656512e2235fa2b524fb7ae1410cfb48e68faf15f58a6","source":{"kind":"arxiv","id":"1711.02326","version":1},"attestation_state":"computed","paper":{"title":"Sparse Attentive Backtracking: Long-Range Credit Assignment in Recurrent Networks","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","cs.NE","stat.ML"],"primary_cat":"cs.AI","authors_text":"Anirudh Goyal, Chris Pal, Jonathan Binas, Laurent Charlin, Nan Rosemary Ke, Olexa Bilaniuk, Yoshua Bengio","submitted_at":"2017-11-07T07:52:12Z","abstract_excerpt":"A major drawback of backpropagation through time (BPTT) is the difficulty of learning long-term dependencies, coming from having to propagate credit information backwards through every single step of the forward computation. This makes BPTT both computationally impractical and biologically implausible. For this reason, full backpropagation through time is rarely used on long sequences, and truncated backpropagation through time is used as a heuristic. However, this usually leads to biased estimates of the gradient in which longer term dependencies are ignored. Addressing this issue, we propose"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1711.02326","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-11-07T07:52:12Z","cross_cats_sorted":["cs.LG","cs.NE","stat.ML"],"title_canon_sha256":"c56a1dba08765d774092e8a24a05b4335feb457ab8493c192312df0968f57af9","abstract_canon_sha256":"97fc27ed91adc7d9173aa4bea486c84d8094ec5d19ad23f296c9e5a92a016d79"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:31:08.219726Z","signature_b64":"s9qliCrQ60j0ilrBiTSeuKBtn/74LmiW0/GMajqh9c6OFwwqyQ0BhxL9iw2bQwIjEqpclJ0zorXm1gGtol3QDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"40e5e813dba6deafdc3656512e2235fa2b524fb7ae1410cfb48e68faf15f58a6","last_reissued_at":"2026-05-18T00:31:08.219124Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:31:08.219124Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Sparse Attentive Backtracking: Long-Range Credit Assignment in Recurrent Networks","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","cs.NE","stat.ML"],"primary_cat":"cs.AI","authors_text":"Anirudh Goyal, Chris Pal, Jonathan Binas, Laurent Charlin, Nan Rosemary Ke, Olexa Bilaniuk, Yoshua Bengio","submitted_at":"2017-11-07T07:52:12Z","abstract_excerpt":"A major drawback of backpropagation through time (BPTT) is the difficulty of learning long-term dependencies, coming from having to propagate credit information backwards through every single step of the forward computation. This makes BPTT both computationally impractical and biologically implausible. For this reason, full backpropagation through time is rarely used on long sequences, and truncated backpropagation through time is used as a heuristic. However, this usually leads to biased estimates of the gradient in which longer term dependencies are ignored. Addressing this issue, we propose"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.02326","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1711.02326","created_at":"2026-05-18T00:31:08.219193+00:00"},{"alias_kind":"arxiv_version","alias_value":"1711.02326v1","created_at":"2026-05-18T00:31:08.219193+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.02326","created_at":"2026-05-18T00:31:08.219193+00:00"},{"alias_kind":"pith_short_12","alias_value":"IDS6QE63U3PK","created_at":"2026-05-18T12:31:21.493067+00:00"},{"alias_kind":"pith_short_16","alias_value":"IDS6QE63U3PK7XBW","created_at":"2026-05-18T12:31:21.493067+00:00"},{"alias_kind":"pith_short_8","alias_value":"IDS6QE63","created_at":"2026-05-18T12:31:21.493067+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/IDS6QE63U3PK7XBWKZIS4IRV7I","json":"https://pith.science/pith/IDS6QE63U3PK7XBWKZIS4IRV7I.json","graph_json":"https://pith.science/api/pith-number/IDS6QE63U3PK7XBWKZIS4IRV7I/graph.json","events_json":"https://pith.science/api/pith-number/IDS6QE63U3PK7XBWKZIS4IRV7I/events.json","paper":"https://pith.science/paper/IDS6QE63"},"agent_actions":{"view_html":"https://pith.science/pith/IDS6QE63U3PK7XBWKZIS4IRV7I","download_json":"https://pith.science/pith/IDS6QE63U3PK7XBWKZIS4IRV7I.json","view_paper":"https://pith.science/paper/IDS6QE63","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1711.02326&json=true","fetch_graph":"https://pith.science/api/pith-number/IDS6QE63U3PK7XBWKZIS4IRV7I/graph.json","fetch_events":"https://pith.science/api/pith-number/IDS6QE63U3PK7XBWKZIS4IRV7I/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/IDS6QE63U3PK7XBWKZIS4IRV7I/action/timestamp_anchor","attest_storage":"https://pith.science/pith/IDS6QE63U3PK7XBWKZIS4IRV7I/action/storage_attestation","attest_author":"https://pith.science/pith/IDS6QE63U3PK7XBWKZIS4IRV7I/action/author_attestation","sign_citation":"https://pith.science/pith/IDS6QE63U3PK7XBWKZIS4IRV7I/action/citation_signature","submit_replication":"https://pith.science/pith/IDS6QE63U3PK7XBWKZIS4IRV7I/action/replication_record"}},"created_at":"2026-05-18T00:31:08.219193+00:00","updated_at":"2026-05-18T00:31:08.219193+00:00"}