{"id":10159,"date":"2025-02-11T09:56:04","date_gmt":"2025-02-11T09:56:04","guid":{"rendered":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/?post_type=gsma_theme_study&#038;p=10159"},"modified":"2025-02-11T10:41:46","modified_gmt":"2025-02-11T10:41:46","slug":"addressing-the-ai-language-gap","status":"publish","type":"gsma_theme_study","link":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/","title":{"rendered":"Addressing the AI Language Gap: Development of the Kazakh-language Large Language Model (Kaz-LLM)"},"content":{"rendered":"\n<p class=\"wp-block-paragraph\">VEON\u2019s Beeline Kazakhstan and its software company QazCode, in collaboration with the Government of Kazakhstan and Nazarbayev University, have developed an open-source Kazakh-language large language model (Kaz-LLM). This project accelerates the adoption of AI-powered products while addressing the the global challenge on the AI language gap for low-resource languages . With over 150 billion tokens collected, curated, synthesized, and translated, the Kaz-LLM interacts seamlessly in Kazakh, Turkish, English, and Russian. The project received technical support from Foundry strategic partners Barcelona Supercomputer (BSC).<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">Partners: Veon, Barcelona Supercomputer, Beeline Kazakhstan, Qazcode<\/p>\n\n\n\n<p class=\"wp-block-paragraph\"><\/p>\n","protected":false},"excerpt":{"rendered":"<p>VEON\u2019s Beeline Kazakhstan and its software company QazCode, in collaboration with the Government of Kazakhstan and Nazarbayev University, have developed an open-source Kazakh-language large language model (Kaz-LLM). This project accelerates the adoption of AI-powered products while addressing the the global challenge on the AI language gap for low-resource languages . With over 150 billion tokens [&hellip;]<\/p>\n","protected":false},"author":21,"featured_media":10162,"template":"","meta":{"image":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2025\/02\/Addressing-the-AI-Language-Gap-scaled.jpg","json":{"gsma_study_logo":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2025\/02\/veon-logo-black.png","gsma_study_category":"0","gsma_study_member":"0","gsma_study_website":"","gsma_study_email":"","gsma_study_twitter":"","gsma_study_facebook":"","gsma_study_linkedin":"","gsma_study_country":"","gsma_study_bg":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2025\/02\/Addressing-the-AI-Language-Gap-scaled.jpg","gsma_study_video":"","gsma_study_sdg":"","gsma_study_hfi":null,"gsma_study_orgs":"10157"},"cats":[],"orgs":[{"ID":10157,"post_author":"21","post_date":"2025-02-11 09:52:11","post_date_gmt":"2025-02-11 09:52:11","post_content":"","post_title":"Veon","post_excerpt":"","post_status":"publish","comment_status":"closed","ping_status":"closed","post_password":"","post_name":"veon","to_ping":"","pinged":"","post_modified":"2025-02-11 10:01:30","post_modified_gmt":"2025-02-11 10:01:30","post_content_filtered":"","post_parent":0,"guid":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/?post_type=gsma_theme_orgs&#038;p=10157","menu_order":0,"post_type":"gsma_theme_orgs","post_mime_type":"","comment_count":"0","filter":"raw","logo":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2025\/02\/veon-logo-black.png"}]},"tags":[],"casestudy_categories":[],"algolia_discover_type":[],"class_list":["post-10159","gsma_theme_study","type-gsma_theme_study","status-publish","has-post-thumbnail","hentry"],"yoast_head":"<!-- This site is optimized with the Yoast SEO Premium plugin v24.4 (Yoast SEO v24.4) - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>Addressing the AI Language Gap: Development of the Kazakh-language Large Language Model (Kaz-LLM) - GSMA Foundry<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/\" \/>\n<meta property=\"og:locale\" content=\"en_US\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"Addressing the AI Language Gap: Development of the Kazakh-language Large Language Model (Kaz-LLM)\" \/>\n<meta property=\"og:description\" content=\"VEON\u2019s Beeline Kazakhstan and its software company QazCode, in collaboration with the Government of Kazakhstan and Nazarbayev University, have developed an open-source Kazakh-language large language model (Kaz-LLM). This project accelerates the adoption of AI-powered products while addressing the the global challenge on the AI language gap for low-resource languages . With over 150 billion tokens [&hellip;]\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/\" \/>\n<meta property=\"og:site_name\" content=\"GSMA Foundry\" \/>\n<meta property=\"article:modified_time\" content=\"2025-02-11T10:41:46+00:00\" \/>\n<meta property=\"og:image\" content=\"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2025\/02\/Addressing-the-AI-Language-Gap-scaled.jpg\" \/>\n\t<meta property=\"og:image:width\" content=\"2560\" \/>\n\t<meta property=\"og:image:height\" content=\"1463\" \/>\n\t<meta property=\"og:image:type\" content=\"image\/jpeg\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:site\" content=\"@gsma\" \/>\n<meta name=\"twitter:label1\" content=\"Est. reading time\" \/>\n\t<meta name=\"twitter:data1\" content=\"1 minute\" \/>\n<!-- \/ Yoast SEO Premium plugin. -->","yoast_head_json":{"title":"Addressing the AI Language Gap: Development of the Kazakh-language Large Language Model (Kaz-LLM) - GSMA Foundry","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/","og_locale":"en_US","og_type":"article","og_title":"Addressing the AI Language Gap: Development of the Kazakh-language Large Language Model (Kaz-LLM)","og_description":"VEON\u2019s Beeline Kazakhstan and its software company QazCode, in collaboration with the Government of Kazakhstan and Nazarbayev University, have developed an open-source Kazakh-language large language model (Kaz-LLM). This project accelerates the adoption of AI-powered products while addressing the the global challenge on the AI language gap for low-resource languages . With over 150 billion tokens [&hellip;]","og_url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/","og_site_name":"GSMA Foundry","article_modified_time":"2025-02-11T10:41:46+00:00","og_image":[{"width":2560,"height":1463,"url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2025\/02\/Addressing-the-AI-Language-Gap-scaled.jpg","type":"image\/jpeg"}],"twitter_card":"summary_large_image","twitter_site":"@gsma","twitter_misc":{"Est. reading time":"1 minute"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/","name":"Addressing the AI Language Gap: Development of the Kazakh-language Large Language Model (Kaz-LLM) - GSMA Foundry","isPartOf":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#website"},"primaryImageOfPage":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/#primaryimage"},"image":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/#primaryimage"},"thumbnailUrl":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2025\/02\/Addressing-the-AI-Language-Gap-scaled.jpg","datePublished":"2025-02-11T09:56:04+00:00","dateModified":"2025-02-11T10:41:46+00:00","breadcrumb":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/#breadcrumb"},"inLanguage":"en-US","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/"]}]},{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/#primaryimage","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2025\/02\/Addressing-the-AI-Language-Gap-scaled.jpg","contentUrl":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2025\/02\/Addressing-the-AI-Language-Gap-scaled.jpg","width":2560,"height":1463,"caption":"Artificial intelligence technology concept with AI text on electronic circuit board. which is talking about digital transformation, business, modern technology and synchronized network connection."},{"@type":"BreadcrumbList","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/gsma_study\/addressing-the-ai-language-gap\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Home","item":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/"},{"@type":"ListItem","position":2,"name":"Addressing the AI Language Gap: Development of the Kazakh-language Large Language Model (Kaz-LLM)"}]},{"@type":"WebSite","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#website","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/","name":"GSMA Foundry","description":"","publisher":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#organization"},"potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"en-US"},{"@type":"Organization","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#organization","name":"GSMA Foundry","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/","logo":{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#\/schema\/logo\/image\/","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2024\/06\/GSMA-Logo-Red-RGB_square.jpg","contentUrl":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2024\/06\/GSMA-Logo-Red-RGB_square.jpg","width":600,"height":600,"caption":"GSMA Foundry"},"image":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#\/schema\/logo\/image\/"},"sameAs":["https:\/\/x.com\/gsma"]}]}},"cats":[{"term_id":223,"name":"5G","slug":"5g","term_group":0,"term_taxonomy_id":223,"taxonomy":"casestudy_categories","description":"","parent":73,"count":8,"filter":"raw"},{"term_id":82,"name":"5G Monetisation","slug":"5g_monetisation","term_group":0,"term_taxonomy_id":82,"taxonomy":"casestudy_categories","description":"","parent":73,"count":13,"filter":"raw"},{"term_id":235,"name":"APIs","slug":"apis","term_group":0,"term_taxonomy_id":235,"taxonomy":"casestudy_categories","description":"","parent":0,"count":1,"filter":"raw"},{"term_id":447,"name":"Automotive","slug":"automotive","term_group":0,"term_taxonomy_id":447,"taxonomy":"casestudy_categories","description":"","parent":0,"count":0,"filter":"raw"},{"term_id":448,"name":"Automotive","slug":"automotive-industry","term_group":0,"term_taxonomy_id":448,"taxonomy":"casestudy_categories","description":"","parent":71,"count":1,"filter":"raw"},{"term_id":78,"name":"Automotive &amp; Aviation","slug":"automotive-aviation","term_group":0,"term_taxonomy_id":78,"taxonomy":"casestudy_categories","description":"","parent":71,"count":9,"filter":"raw"},{"term_id":73,"name":"Benefit","slug":"benefit","term_group":0,"term_taxonomy_id":73,"taxonomy":"casestudy_categories","description":"","parent":0,"count":1,"filter":"raw"},{"term_id":87,"name":"CapEx \/ OpEx Reduction","slug":"capex","term_group":0,"term_taxonomy_id":87,"taxonomy":"casestudy_categories","description":"","parent":73,"count":3,"filter":"raw"},{"term_id":88,"name":"Cost Reduction \/ Value","slug":"cost_reduction","term_group":0,"term_taxonomy_id":88,"taxonomy":"casestudy_categories","description":"","parent":73,"count":10,"filter":"raw"},{"term_id":81,"name":"delivered","slug":"delivered","term_group":0,"term_taxonomy_id":81,"taxonomy":"casestudy_categories","description":"","parent":76,"count":55,"filter":"raw"},{"term_id":74,"name":"Efficiency","slug":"efficiency","term_group":0,"term_taxonomy_id":74,"taxonomy":"casestudy_categories","description":"","parent":73,"count":23,"filter":"raw"},{"term_id":91,"name":"FinTech","slug":"fintech","term_group":0,"term_taxonomy_id":91,"taxonomy":"casestudy_categories","description":"","parent":71,"count":4,"filter":"raw"},{"term_id":83,"name":"Global Reach","slug":"global","term_group":0,"term_taxonomy_id":83,"taxonomy":"casestudy_categories","description":"","parent":73,"count":12,"filter":"raw"},{"term_id":215,"name":"GSMA Foundry project","slug":"gsma-foundry-project","term_group":0,"term_taxonomy_id":215,"taxonomy":"casestudy_categories","description":"","parent":0,"count":11,"filter":"raw"},{"term_id":92,"name":"Identity","slug":"identity","term_group":0,"term_taxonomy_id":92,"taxonomy":"casestudy_categories","description":"","parent":71,"count":4,"filter":"raw"},{"term_id":77,"name":"in progress","slug":"in_progress","term_group":0,"term_taxonomy_id":77,"taxonomy":"casestudy_categories","description":"","parent":76,"count":3,"filter":"raw"},{"term_id":71,"name":"Industry","slug":"industry","term_group":0,"term_taxonomy_id":71,"taxonomy":"casestudy_categories","description":"","parent":0,"count":0,"filter":"raw"},{"term_id":89,"name":"Interoperability","slug":"interoperability","term_group":0,"term_taxonomy_id":89,"taxonomy":"casestudy_categories","description":"","parent":73,"count":7,"filter":"raw"},{"term_id":214,"name":"Logistics, Asset Tracking","slug":"logistics-asset-tracking","term_group":0,"term_taxonomy_id":214,"taxonomy":"casestudy_categories","description":"","parent":0,"count":0,"filter":"raw"},{"term_id":79,"name":"Logistics, Monitoring &amp; Surveillance","slug":"logistics","term_group":0,"term_taxonomy_id":79,"taxonomy":"casestudy_categories","description":"","parent":71,"count":12,"filter":"raw"},{"term_id":80,"name":"Network Efficiency \/ Reliability","slug":"network","term_group":0,"term_taxonomy_id":80,"taxonomy":"casestudy_categories","description":"","parent":73,"count":27,"filter":"raw"},{"term_id":72,"name":"Networks &amp; Telecommunications","slug":"networks","term_group":0,"term_taxonomy_id":72,"taxonomy":"casestudy_categories","description":"","parent":71,"count":30,"filter":"raw"},{"term_id":90,"name":"New Revenues","slug":"revenues","term_group":0,"term_taxonomy_id":90,"taxonomy":"casestudy_categories","description":"","parent":73,"count":10,"filter":"raw"},{"term_id":102,"name":"Non-Terrestrial Networks","slug":"non-terrestrial-networks","term_group":0,"term_taxonomy_id":102,"taxonomy":"casestudy_categories","description":"","parent":71,"count":9,"filter":"raw"},{"term_id":459,"name":"Quantum","slug":"quantum","term_group":0,"term_taxonomy_id":459,"taxonomy":"casestudy_categories","description":"","parent":0,"count":0,"filter":"raw"},{"term_id":84,"name":"Security","slug":"security","term_group":0,"term_taxonomy_id":84,"taxonomy":"casestudy_categories","description":"","parent":71,"count":9,"filter":"raw"},{"term_id":85,"name":"Smart Cities","slug":"smart-cities","term_group":0,"term_taxonomy_id":85,"taxonomy":"casestudy_categories","description":"","parent":71,"count":6,"filter":"raw"},{"term_id":86,"name":"Smart Production &amp; Manufacturing","slug":"smart-production","term_group":0,"term_taxonomy_id":86,"taxonomy":"casestudy_categories","description":"","parent":71,"count":10,"filter":"raw"},{"term_id":76,"name":"Status","slug":"status","term_group":0,"term_taxonomy_id":76,"taxonomy":"casestudy_categories","description":"","parent":0,"count":1,"filter":"raw"},{"term_id":75,"name":"Sustainability","slug":"sustainability","term_group":0,"term_taxonomy_id":75,"taxonomy":"casestudy_categories","description":"","parent":73,"count":10,"filter":"raw"},{"term_id":451,"name":"Wearables","slug":"wearables","term_group":0,"term_taxonomy_id":451,"taxonomy":"casestudy_categories","description":"","parent":0,"count":1,"filter":"raw"}],"_links":{"self":[{"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/gsma_theme_study\/10159","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/gsma_theme_study"}],"about":[{"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/types\/gsma_theme_study"}],"author":[{"embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/users\/21"}],"version-history":[{"count":3,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/gsma_theme_study\/10159\/revisions"}],"predecessor-version":[{"id":10167,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/gsma_theme_study\/10159\/revisions\/10167"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/media\/10162"}],"wp:attachment":[{"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/media?parent=10159"}],"wp:term":[{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/tags?post=10159"},{"taxonomy":"casestudy_categories","embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/casestudy_categories?post=10159"},{"taxonomy":"algolia_discover_type","embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/algolia_discover_type?post=10159"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}