{"674259":{"#nid":"674259","#data":{"type":"event","title":"IC Distinguished Lecture Series with Guest Speaker Noah Smith","body":[{"value":"\u003Cp\u003E\u003Cstrong\u003EAbstract\u003C\/strong\u003E\u003C\/p\u003E\r\n\r\n\u003Cp\u003ENeural language models with billions of parameters and trained on trillions of words are powering the fastest-growing computing applications in history and generating discussion and debate around the world. Yet most scientists cannot study or improve those state-of-the-art models because the organizations deploying them keep their data and machine learning processes secret. I believe that the path to models that are usable by all, at low cost, customizable for areas of critical need like the sciences, and whose capabilities and limitations are made transparent and understandable, is\u0026nbsp;\u003Cem\u003Eradically open development\u003C\/em\u003E, with academic and not-for-profit researchers empowered to do reproducible science.\u0026nbsp;Projects like Falcon, Llama, MPT, and Pythia provide glimmers of hope.\u0026nbsp; In this talk, I\u2019ll share the story of the work our team is doing to radically open up the science of language modeling.\u0026nbsp;As of April 2024, we\u2019ve released Dolma, a three-trillion-token open dataset curated for training language models, and used it to pretrain OLMo v1, also publicly released. We\u2019ve also built and released T\u00fclu, a series of open instruction-tuned models.\u0026nbsp;All of these come with open-source code and extensive documentation, including new tools for evaluation.\u0026nbsp;Together these artifacts make it possible to explore new scientific questions and democratize control of the future of this fascinating and important technology.\u0026nbsp;\u0026nbsp;\u003C\/p\u003E\r\n\r\n\u003Cp\u003EThe work I\u2019ll present was carried out primarily by a large team at the Allen Institute for Artificial Intelligence in Seattle, with collaboration from the Paul G. Allen School at the University of Washington and various kinds of support and coordination from many organizations, including the Kempner Institute for the Study of Natural and Artificial Intelligence at Harvard University, AMD, CSC - IT Center for Science (Finland), Databricks, and\u0026nbsp;Together.ai. \u0026nbsp;\u003C\/p\u003E\r\n","summary":"","format":"limited_html"}],"field_subtitle":"","field_summary":[{"value":"\u003Cp\u003E\u003Cstrong\u003ETalk Title \u2014 It\u2019s Time to Open Up Language Models\u003C\/strong\u003E\u003C\/p\u003E\r\n","format":"limited_html"}],"field_summary_sentence":[{"value":"Talk Title \u2014 It\u2019s Time to Open Up Language Models"}],"uid":"36530","created_gmt":"2024-04-18 15:11:42","changed_gmt":"2024-04-18 15:18:42","author":"Nathan Deen","boilerplate_text":"","field_publication":"","field_article_url":"","field_event_time":{"event_time_start":"2024-04-26T11:00:40-04:00","event_time_end":"2024-04-26T12:00:00-04:00","event_time_end_last":"2024-04-26T12:00:00-04:00","gmt_time_start":"2024-04-26 15:00:40","gmt_time_end":"2024-04-26 16:00:00","gmt_time_end_last":"2024-04-26 16:00:00","rrule":null,"timezone":"America\/New_York"},"location":"Technology Square Research Building, 1st Floor Auditorium, Room 118","extras":[],"hg_media":{"673750":{"id":"673750","type":"image","title":"nasmith_headshot.jpeg","body":null,"created":"1713453368","gmt_created":"2024-04-18 15:16:08","changed":"1713453368","gmt_changed":"2024-04-18 15:16:08","alt":"Noah Smith","file":{"fid":"257183","name":"nasmith_headshot.jpeg","image_path":"\/sites\/default\/files\/2024\/04\/18\/nasmith_headshot.jpeg","image_full_path":"http:\/\/hg.gatech.edu\/\/sites\/default\/files\/2024\/04\/18\/nasmith_headshot.jpeg","mime":"image\/jpeg","size":418048,"path_740":"http:\/\/hg.gatech.edu\/sites\/default\/files\/styles\/740xx_scale\/public\/2024\/04\/18\/nasmith_headshot.jpeg?itok=Yltg76ei"}}},"media_ids":["673750"],"groups":[{"id":"47223","name":"College of Computing"},{"id":"50876","name":"School of Interactive Computing"}],"categories":[],"keywords":[],"core_research_areas":[],"news_room_topics":[],"event_categories":[],"invited_audience":[],"affiliations":[],"classification":[],"areas_of_expertise":[],"news_and_recent_appearances":[],"phone":[],"contact":[{"value":"\u003Cp\u003ENathan Deen\u003C\/p\u003E\r\n\r\n\u003Cp\u003ECommunications Officer I\u003C\/p\u003E\r\n\r\n\u003Cp\u003ESchool of Interactive Computing\u003C\/p\u003E\r\n","format":"limited_html"}],"email":[],"slides":[],"orientation":[],"userdata":""}}}