{"work":{"id":"9a41dfbd-d7c8-4b32-943f-59c08fdd6db7","openalex_id":"https://openalex.org/W1861492603","doi":"10.1007/978-3-319-10602-1_48","arxiv_id":null,"raw_key":null,"title":"Microsoft COCO: common objects in context,","authors":[{"given":"Tsung-Yi","family":"Lin","sequence":"first","affiliation":[]},{"given":"Michael","family":"Maire","sequence":"additional","affiliation":[]},{"given":"Serge","family":"Belongie","sequence":"additional","affiliation":[]},{"given":"James","family":"Hays","sequence":"additional","affiliation":[]},{"given":"Pietro","family":"Perona","sequence":"additional","affiliation":[]},{"given":"Deva","family":"Ramanan","sequence":"additional","affiliation":[]},{"given":"Piotr","family":"Dollár","sequence":"additional","affiliation":[]},{"given":"C. Lawrence","family":"Zitnick","sequence":"additional","affiliation":[]}],"authors_text":"T","year":2014,"venue":"Lecture Notes in Computer Science","abstract":null,"external_url":"https://doi.org/10.1007/978-3-319-10602-1_48","cited_by_count":24966,"metadata_source":"doi_reference","metadata_fetched_at":"2026-05-25T04:25:18.804156+00:00","pith_arxiv_id":null,"created_at":"2026-05-08T18:33:59.304533+00:00","updated_at":"2026-05-25T04:25:18.804156+00:00","title_quality_ok":true,"display_title":"Lawrence Zitnick","render_title":"Lawrence Zitnick"},"hub":{"state":{"work_id":"9a41dfbd-d7c8-4b32-943f-59c08fdd6db7","tier":"super_hub","tier_reason":"100+ Pith inbound or 10,000+ external citations","pith_inbound_count":21,"external_cited_by_count":24966,"distinct_field_count":7,"first_pith_cited_at":"2024-03-05T18:45:39+00:00","last_pith_cited_at":"2026-05-22T17:21:06+00:00","author_build_status":"needed","summary_status":"needed","contexts_status":"needed","graph_status":"needed","ask_index_status":"needed","reader_status":"not_needed","recognition_status":"not_needed","updated_at":"2026-06-03T16:56:13.956193+00:00","tier_text":"super_hub"},"tier":"super_hub","role_counts":[{"context_role":"background","n":3},{"context_role":"dataset","n":3}],"polarity_counts":[{"context_polarity":"background","n":4},{"context_polarity":"use_dataset","n":2}],"runs":{"ask_index":{"job_type":"ask_index","status":"succeeded","result":{"title":"Lawrence Zitnick","claims":[],"why_cited":"Pith tracks Lawrence Zitnick because it crossed a citation-hub threshold.","role_counts":[]},"error":null,"updated_at":"2026-05-14T03:46:05.311995+00:00"},"author_expand":{"job_type":"author_expand","status":"succeeded","result":{"authors_linked":[{"id":"00e2756c-d70b-49a9-b019-ad42b25d5fab","orcid":null,"display_name":"Tsung-Yi Lin"},{"id":"4cdcb464-a6d3-44b3-a8fe-9e19975a8c9f","orcid":null,"display_name":"Michael Maire"},{"id":"36afc0d9-76dd-4868-9798-8e85bf567350","orcid":null,"display_name":"Serge Belongie"},{"id":"688e76cc-a7a9-4957-a415-5ad7189d073f","orcid":null,"display_name":"James Hays"},{"id":"46597a21-9794-47fe-a568-b329b5dee25f","orcid":null,"display_name":"Pietro Perona"},{"id":"357117ed-8a94-478b-93d0-35124e4d9a73","orcid":null,"display_name":"Deva Ramanan"},{"id":"9673a109-8699-40f3-b9a4-3da58f8bdde6","orcid":null,"display_name":"Piotr Dollár"},{"id":"594baa5f-8b5f-49d9-893d-80f061c4a41a","orcid":null,"display_name":"C. Lawrence Zitnick"}]},"error":null,"updated_at":"2026-05-14T03:46:07.131251+00:00"},"context_extract":{"job_type":"context_extract","status":"succeeded","result":{"enqueued_papers":25},"error":null,"updated_at":"2026-05-14T03:36:13.114485+00:00"},"graph_features":{"job_type":"graph_features","status":"succeeded","result":{"co_cited":[{"title":"Masked autoencoders are scalable vision learners","work_id":"0a23d1b7-bd56-43cc-8a80-7c43ce994e1e","shared_citers":4},{"title":"& Vondrick, C","work_id":"b8a8bb9e-1d31-40e2-9cab-ae21e338dde6","shared_citers":4},{"title":"Eyes Wide Shut? Exploring the Visual Shortcomings of Multimodal LLMs","work_id":"7efbc2dd-b0f2-4f71-bb1c-d2fcf110d805","shared_citers":2},{"title":"Feature Pyramid Networks for Object Detection","work_id":"dde3fe4f-1210-48b9-851c-ba5177fe8ffb","shared_citers":2},{"title":"Heinig, K","work_id":"cf4c4e77-acaa-46b4-b066-ddf045165d05","shared_citers":2},{"title":"In: 2023 IEEE/CVF International Conference on Computer Vision (ICCV)","work_id":"2a2d1133-ca8a-44c4-a105-9e5f80354b38","shared_citers":2},{"title":"In: IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","work_id":"5674e43c-0bd6-4797-9061-d3bd7ec0850f","shared_citers":2},{"title":"In: Proceedings of the IEEE/CVF International Conference on Computer Vision, pp","work_id":"ed935943-7859-442f-aee2-2a1bfda624d4","shared_citers":2},{"title":"Microsoft COCO Captions: Data Collection and Evaluation Server","work_id":"b3d6fb46-4169-4a28-8f7e-2ca6774211da","shared_citers":2},{"title":"Qwen2.5-VL Technical Report","work_id":"69dffacb-bfe8-442d-be86-48624c60426f","shared_citers":2},{"title":"Tomasi and R","work_id":"135418b1-cafd-49fd-803d-1ca6433d4b1b","shared_citers":2},{"title":"URLhttp://dx.doi.org/10.1109/CVPR.2016.90","work_id":"b353bda2-591d-479a-9c8b-22dfcba12431","shared_citers":2},{"title":"You Only Look Once: Unified, Real-Time Object Detection","work_id":"37ab4f11-9f69-480d-aab9-e7d9826c586d","shared_citers":2},{"title":"1768 , publisher=","work_id":"b5ff924c-4267-4b08-8c95-566ceb3bab96","shared_citers":1},{"title":"1981.Multiple Attribute Decision Making: Methods and Applications","work_id":"7698541c-ce5a-4ef7-b576-ceae0dcc5e63","shared_citers":1},{"title":"2008 , url=","work_id":"0ce6a061-cd10-461d-9646-57e211c62876","shared_citers":1},{"title":"2010, Classical and Quantum Gravity, 27, 084013, doi: 10.1088/0264-9381/27/8/084013","work_id":"aa092362-d6ae-447d-b2ca-7848b8743d54","shared_citers":1},{"title":"2010, in Proceedings of COMPSTAT’2010: 19th International Conference on Computational Statistics, Springer, 177–186, doi: 10.1007/978-3-7908-2604-3_16","work_id":"87a76526-2ebb-424d-85ac-8c96da34f3bd","shared_citers":1},{"title":"2011, International Journal of Modern Physics D, 20, 989, doi: 10.1142/S0218271811019335","work_id":"e3eb42a2-83d5-436d-a9af-658cac917ad0","shared_citers":1},{"title":"2016, in 2016 Fourth International Conference on 3D Vision (3DV), IEEE, 565–571, doi: 10.1109/3DV.2016.79","work_id":"43e6c945-3b53-46f1-b9c3-b53708f491c3","shared_citers":1},{"title":"2017, Astronomy and Computing, 18, 35, doi: 10.1016/j.ascom.2017.01.002","work_id":"02b908e1-075e-47d6-899a-fba0ff00454c","shared_citers":1},{"title":"2017 , eprint=","work_id":"2c923374-2fee-4c42-a0f9-f706b8a72242","shared_citers":1},{"title":"2017 , eprint=","work_id":"72d4171a-6c4c-41a9-b5b1-a38637a23f93","shared_citers":1},{"title":"2017, in Proceedings of the IEEE International Conference on Computer Vision, 2961–2969, doi: 10.1109/ICCV.2017.322","work_id":"d738c48d-e0c3-4351-b469-16a549b6c9c5","shared_citers":1}],"time_series":[{"n":1,"year":2024},{"n":12,"year":2026}],"dependency_candidates":[]},"error":null,"updated_at":"2026-05-14T03:46:11.375192+00:00"},"identity_refresh":{"job_type":"identity_refresh","status":"succeeded","result":{"items":[{"title":"Qwen3 Technical Report","outcome":"unchanged","work_id":"25a4e30c-1232-48e7-9925-02fa12ba7c9e","resolver":"local_arxiv","confidence":0.98,"old_work_id":"25a4e30c-1232-48e7-9925-02fa12ba7c9e"}],"counts":{"fixed":0,"merged":0,"unchanged":1,"quarantined":0,"needs_external_resolution":0},"errors":[],"attempted":1},"error":null,"updated_at":"2026-05-14T03:36:17.207500+00:00"},"role_polarity":{"job_type":"role_polarity","status":"succeeded","result":{"title":"Lawrence Zitnick","claims":[],"why_cited":"Pith tracks Lawrence Zitnick because it crossed a citation-hub threshold.","role_counts":[]},"error":null,"updated_at":"2026-05-14T03:36:13.119732+00:00"},"summary_claims":{"job_type":"summary_claims","status":"succeeded","result":{"title":"Lawrence Zitnick","claims":[],"why_cited":"Pith tracks Lawrence Zitnick because it crossed a citation-hub threshold.","role_counts":[]},"error":null,"updated_at":"2026-05-14T03:36:17.227842+00:00"}},"summary":{"title":"Lawrence Zitnick","claims":[],"why_cited":"Pith tracks Lawrence Zitnick because it crossed a citation-hub threshold.","role_counts":[]},"graph":{"co_cited":[{"title":"Masked autoencoders are scalable vision learners","work_id":"0a23d1b7-bd56-43cc-8a80-7c43ce994e1e","shared_citers":4},{"title":"& Vondrick, C","work_id":"b8a8bb9e-1d31-40e2-9cab-ae21e338dde6","shared_citers":4},{"title":"Eyes Wide Shut? Exploring the Visual Shortcomings of Multimodal LLMs","work_id":"7efbc2dd-b0f2-4f71-bb1c-d2fcf110d805","shared_citers":2},{"title":"Feature Pyramid Networks for Object Detection","work_id":"dde3fe4f-1210-48b9-851c-ba5177fe8ffb","shared_citers":2},{"title":"Heinig, K","work_id":"cf4c4e77-acaa-46b4-b066-ddf045165d05","shared_citers":2},{"title":"In: 2023 IEEE/CVF International Conference on Computer Vision (ICCV)","work_id":"2a2d1133-ca8a-44c4-a105-9e5f80354b38","shared_citers":2},{"title":"In: IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","work_id":"5674e43c-0bd6-4797-9061-d3bd7ec0850f","shared_citers":2},{"title":"In: Proceedings of the IEEE/CVF International Conference on Computer Vision, pp","work_id":"ed935943-7859-442f-aee2-2a1bfda624d4","shared_citers":2},{"title":"Microsoft COCO Captions: Data Collection and Evaluation Server","work_id":"b3d6fb46-4169-4a28-8f7e-2ca6774211da","shared_citers":2},{"title":"Qwen2.5-VL Technical Report","work_id":"69dffacb-bfe8-442d-be86-48624c60426f","shared_citers":2},{"title":"Tomasi and R","work_id":"135418b1-cafd-49fd-803d-1ca6433d4b1b","shared_citers":2},{"title":"URLhttp://dx.doi.org/10.1109/CVPR.2016.90","work_id":"b353bda2-591d-479a-9c8b-22dfcba12431","shared_citers":2},{"title":"You Only Look Once: Unified, Real-Time Object Detection","work_id":"37ab4f11-9f69-480d-aab9-e7d9826c586d","shared_citers":2},{"title":"1768 , publisher=","work_id":"b5ff924c-4267-4b08-8c95-566ceb3bab96","shared_citers":1},{"title":"1981.Multiple Attribute Decision Making: Methods and Applications","work_id":"7698541c-ce5a-4ef7-b576-ceae0dcc5e63","shared_citers":1},{"title":"2008 , url=","work_id":"0ce6a061-cd10-461d-9646-57e211c62876","shared_citers":1},{"title":"2010, Classical and Quantum Gravity, 27, 084013, doi: 10.1088/0264-9381/27/8/084013","work_id":"aa092362-d6ae-447d-b2ca-7848b8743d54","shared_citers":1},{"title":"2010, in Proceedings of COMPSTAT’2010: 19th International Conference on Computational Statistics, Springer, 177–186, doi: 10.1007/978-3-7908-2604-3_16","work_id":"87a76526-2ebb-424d-85ac-8c96da34f3bd","shared_citers":1},{"title":"2011, International Journal of Modern Physics D, 20, 989, doi: 10.1142/S0218271811019335","work_id":"e3eb42a2-83d5-436d-a9af-658cac917ad0","shared_citers":1},{"title":"2016, in 2016 Fourth International Conference on 3D Vision (3DV), IEEE, 565–571, doi: 10.1109/3DV.2016.79","work_id":"43e6c945-3b53-46f1-b9c3-b53708f491c3","shared_citers":1},{"title":"2017, Astronomy and Computing, 18, 35, doi: 10.1016/j.ascom.2017.01.002","work_id":"02b908e1-075e-47d6-899a-fba0ff00454c","shared_citers":1},{"title":"2017 , eprint=","work_id":"2c923374-2fee-4c42-a0f9-f706b8a72242","shared_citers":1},{"title":"2017 , eprint=","work_id":"72d4171a-6c4c-41a9-b5b1-a38637a23f93","shared_citers":1},{"title":"2017, in Proceedings of the IEEE International Conference on Computer Vision, 2961–2969, doi: 10.1109/ICCV.2017.322","work_id":"d738c48d-e0c3-4351-b469-16a549b6c9c5","shared_citers":1}],"time_series":[{"n":1,"year":2024},{"n":12,"year":2026}],"dependency_candidates":[]},"authors":[{"id":"594baa5f-8b5f-49d9-893d-80f061c4a41a","orcid":null,"display_name":"C. Lawrence Zitnick","source":"manual","import_confidence":0.72},{"id":"357117ed-8a94-478b-93d0-35124e4d9a73","orcid":null,"display_name":"Deva Ramanan","source":"manual","import_confidence":0.72},{"id":"688e76cc-a7a9-4957-a415-5ad7189d073f","orcid":null,"display_name":"James Hays","source":"manual","import_confidence":0.72},{"id":"4cdcb464-a6d3-44b3-a8fe-9e19975a8c9f","orcid":null,"display_name":"Michael Maire","source":"manual","import_confidence":0.72},{"id":"46597a21-9794-47fe-a568-b329b5dee25f","orcid":null,"display_name":"Pietro Perona","source":"manual","import_confidence":0.72},{"id":"9673a109-8699-40f3-b9a4-3da58f8bdde6","orcid":null,"display_name":"Piotr Dollár","source":"manual","import_confidence":0.72},{"id":"36afc0d9-76dd-4868-9798-8e85bf567350","orcid":null,"display_name":"Serge Belongie","source":"manual","import_confidence":0.72},{"id":"00e2756c-d70b-49a9-b019-ad42b25d5fab","orcid":null,"display_name":"Tsung-Yi Lin","source":"manual","import_confidence":0.72}]}}