{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2016:IK7TEGSW4ODN7YT7UJVK3EM73O","short_pith_number":"pith:IK7TEGSW","schema_version":"1.0","canonical_sha256":"42bf321a56e386dfe27fa26aad919fdbac22fbb46e58af4c88f37d1084784ad3","source":{"kind":"arxiv","id":"1611.03777","version":1},"attestation_state":"computed","paper":{"title":"Tricks from Deep Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"At{\\i}l{\\i}m G\\\"une\\c{s} Baydin, Barak A. Pearlmutter, Jeffrey Mark Siskind","submitted_at":"2016-11-10T17:57:19Z","abstract_excerpt":"The deep learning community has devised a diverse set of methods to make gradient optimization, using large datasets, of large and highly complex models with deeply cascaded nonlinearities, practical. Taken as a whole, these methods constitute a breakthrough, allowing computational structures which are quite wide, very deep, and with an enormous number and variety of free parameters to be effectively optimized. The result now dominates much of practical machine learning, with applications in machine translation, computer vision, and speech recognition. Many of these methods, viewed through the"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1611.03777","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-10T17:57:19Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"aa6ac034abf574c71c34c22af281cd3325e70f0d712c74611e8cebd21935963c","abstract_canon_sha256":"f8e33f42c4517eb5ad5e1543d3b07d96293726dc9e629aaef99bb2b4dddca1f9"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:59:33.361667Z","signature_b64":"zz2VrKEeGxa1vw50Hqi2CZdrC0UMVh91RMpZpsrIW5CKDvjEQWOE9J/g7r4yCFhFHhox0fzxr0OJ9NIcBFUPAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"42bf321a56e386dfe27fa26aad919fdbac22fbb46e58af4c88f37d1084784ad3","last_reissued_at":"2026-05-18T00:59:33.360981Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:59:33.360981Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Tricks from Deep Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"At{\\i}l{\\i}m G\\\"une\\c{s} Baydin, Barak A. Pearlmutter, Jeffrey Mark Siskind","submitted_at":"2016-11-10T17:57:19Z","abstract_excerpt":"The deep learning community has devised a diverse set of methods to make gradient optimization, using large datasets, of large and highly complex models with deeply cascaded nonlinearities, practical. Taken as a whole, these methods constitute a breakthrough, allowing computational structures which are quite wide, very deep, and with an enormous number and variety of free parameters to be effectively optimized. The result now dominates much of practical machine learning, with applications in machine translation, computer vision, and speech recognition. Many of these methods, viewed through the"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1611.03777","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1611.03777","created_at":"2026-05-18T00:59:33.361096+00:00"},{"alias_kind":"arxiv_version","alias_value":"1611.03777v1","created_at":"2026-05-18T00:59:33.361096+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1611.03777","created_at":"2026-05-18T00:59:33.361096+00:00"},{"alias_kind":"pith_short_12","alias_value":"IK7TEGSW4ODN","created_at":"2026-05-18T12:30:22.444734+00:00"},{"alias_kind":"pith_short_16","alias_value":"IK7TEGSW4ODN7YT7","created_at":"2026-05-18T12:30:22.444734+00:00"},{"alias_kind":"pith_short_8","alias_value":"IK7TEGSW","created_at":"2026-05-18T12:30:22.444734+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/IK7TEGSW4ODN7YT7UJVK3EM73O","json":"https://pith.science/pith/IK7TEGSW4ODN7YT7UJVK3EM73O.json","graph_json":"https://pith.science/api/pith-number/IK7TEGSW4ODN7YT7UJVK3EM73O/graph.json","events_json":"https://pith.science/api/pith-number/IK7TEGSW4ODN7YT7UJVK3EM73O/events.json","paper":"https://pith.science/paper/IK7TEGSW"},"agent_actions":{"view_html":"https://pith.science/pith/IK7TEGSW4ODN7YT7UJVK3EM73O","download_json":"https://pith.science/pith/IK7TEGSW4ODN7YT7UJVK3EM73O.json","view_paper":"https://pith.science/paper/IK7TEGSW","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1611.03777&json=true","fetch_graph":"https://pith.science/api/pith-number/IK7TEGSW4ODN7YT7UJVK3EM73O/graph.json","fetch_events":"https://pith.science/api/pith-number/IK7TEGSW4ODN7YT7UJVK3EM73O/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/IK7TEGSW4ODN7YT7UJVK3EM73O/action/timestamp_anchor","attest_storage":"https://pith.science/pith/IK7TEGSW4ODN7YT7UJVK3EM73O/action/storage_attestation","attest_author":"https://pith.science/pith/IK7TEGSW4ODN7YT7UJVK3EM73O/action/author_attestation","sign_citation":"https://pith.science/pith/IK7TEGSW4ODN7YT7UJVK3EM73O/action/citation_signature","submit_replication":"https://pith.science/pith/IK7TEGSW4ODN7YT7UJVK3EM73O/action/replication_record"}},"created_at":"2026-05-18T00:59:33.361096+00:00","updated_at":"2026-05-18T00:59:33.361096+00:00"}