{"id":15777,"date":"2026-07-02T09:42:20","date_gmt":"2026-07-02T09:42:20","guid":{"rendered":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/?p=15777"},"modified":"2026-07-02T09:42:43","modified_gmt":"2026-07-02T09:42:43","slug":"telecom-common-corpus","status":"publish","type":"post","link":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/","title":{"rendered":"Telecom Common Corpus"},"content":{"rendered":"\n<p class=\"wp-block-paragraph\">GSMA and Pleias.ai have released the Telco Common Corpus \u2014 10+ billion tokens of open, license-verified telecom knowledge covering scientific literature, patents, standards and open-web sources. The first dataset of its kind for the industry, built to supply specialist model training at scale.<\/p>\n\n\n\n<div class=\"wp-block-buttons is-layout-flex wp-block-buttons-is-layout-flex\">\n<div class=\"wp-block-button\"><a class=\"wp-block-button__link wp-element-button\" href=\"https:\/\/www.open-telco.ai\/telco-common-corpus-an-open-verified-data-commons-for-telecom-ai\/\">Read the Blog<\/a><\/div>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>GSMA and Pleias.ai have released the Telco Common Corpus \u2014 10+ billion tokens of open, license-verified telecom knowledge covering scientific literature, patents, standards and open-web sources. The first dataset of its kind for the industry, built to supply specialist model training at scale.<\/p>\n","protected":false},"author":32,"featured_media":15779,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"_oasis_is_in_workflow":0,"_oasis_original":0,"_oasis_task_priority":"","footnotes":""},"categories":[125],"tags":[357,406],"algolia_discover_type":[],"class_list":["post-15777","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-artificial-intelligence","tag-ai","tag-technology"],"yoast_head":"<!-- This site is optimized with the Yoast SEO Premium plugin v24.4 (Yoast SEO v27.9) - https:\/\/yoast.com\/product\/yoast-seo-premium-wordpress\/ -->\n<title>Telecom Common Corpus - GSMA Foundry<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/\" \/>\n<meta property=\"og:locale\" content=\"en_US\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"Telecom Common Corpus\" \/>\n<meta property=\"og:description\" content=\"GSMA and Pleias.ai have released the Telco Common Corpus \u2014 10+ billion tokens of open, license-verified telecom knowledge covering scientific literature, patents, standards and open-web sources. The first dataset of its kind for the industry, built to supply specialist model training at scale.\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/\" \/>\n<meta property=\"og:site_name\" content=\"GSMA Foundry\" \/>\n<meta property=\"article:published_time\" content=\"2026-07-02T09:42:20+00:00\" \/>\n<meta property=\"article:modified_time\" content=\"2026-07-02T09:42:43+00:00\" \/>\n<meta property=\"og:image\" content=\"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2026\/07\/Telecom-Common-Corpus-616x616-1.png\" \/>\n\t<meta property=\"og:image:width\" content=\"616\" \/>\n\t<meta property=\"og:image:height\" content=\"616\" \/>\n\t<meta property=\"og:image:type\" content=\"image\/png\" \/>\n<meta name=\"author\" content=\"nchouhan@gsma.com\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:creator\" content=\"@gsma\" \/>\n<meta name=\"twitter:site\" content=\"@gsma\" \/>\n<meta name=\"twitter:label1\" content=\"Written by\" \/>\n\t<meta name=\"twitter:data1\" content=\"nchouhan@gsma.com\" \/>\n\t<meta name=\"twitter:label2\" content=\"Est. reading time\" \/>\n\t<meta name=\"twitter:data2\" content=\"1 minute\" \/>\n<!-- \/ Yoast SEO Premium plugin. -->","yoast_head_json":{"title":"Telecom Common Corpus - GSMA Foundry","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/","og_locale":"en_US","og_type":"article","og_title":"Telecom Common Corpus","og_description":"GSMA and Pleias.ai have released the Telco Common Corpus \u2014 10+ billion tokens of open, license-verified telecom knowledge covering scientific literature, patents, standards and open-web sources. The first dataset of its kind for the industry, built to supply specialist model training at scale.","og_url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/","og_site_name":"GSMA Foundry","article_published_time":"2026-07-02T09:42:20+00:00","article_modified_time":"2026-07-02T09:42:43+00:00","og_image":[{"width":616,"height":616,"url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2026\/07\/Telecom-Common-Corpus-616x616-1.png","type":"image\/png"}],"author":"nchouhan@gsma.com","twitter_card":"summary_large_image","twitter_creator":"@gsma","twitter_site":"@gsma","twitter_misc":{"Written by":"nchouhan@gsma.com","Est. reading time":"1 minute"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"Article","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/#article","isPartOf":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/"},"author":{"name":"nchouhan@gsma.com","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#\/schema\/person\/aa49e7aa16edc4611533b381c8021368"},"headline":"Telecom Common Corpus","datePublished":"2026-07-02T09:42:20+00:00","dateModified":"2026-07-02T09:42:43+00:00","mainEntityOfPage":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/"},"wordCount":48,"commentCount":0,"publisher":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#organization"},"image":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/#primaryimage"},"thumbnailUrl":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2026\/07\/Telecom-Common-Corpus-616x616-1.png","keywords":["AI","Technology"],"articleSection":["Artificial Intelligence"],"inLanguage":"en-US","potentialAction":[{"@type":"CommentAction","name":"Comment","target":["https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/#respond"]}]},{"@type":"WebPage","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/","name":"Telecom Common Corpus - GSMA Foundry","isPartOf":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#website"},"primaryImageOfPage":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/#primaryimage"},"image":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/#primaryimage"},"thumbnailUrl":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2026\/07\/Telecom-Common-Corpus-616x616-1.png","datePublished":"2026-07-02T09:42:20+00:00","dateModified":"2026-07-02T09:42:43+00:00","breadcrumb":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/#breadcrumb"},"inLanguage":"en-US","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/"]}]},{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/#primaryimage","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2026\/07\/Telecom-Common-Corpus-616x616-1.png","contentUrl":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2026\/07\/Telecom-Common-Corpus-616x616-1.png","width":616,"height":616,"caption":"A black infographic with red and white text titled \"TELECOM COMMON CORPUS\" shows over 10B telecom-related tokens sourced from 11 categories. The largest sources are 3GPP docs, US patents, RFC mailing lists, IEEE open access, and EU patents, with token counts and horizontal bars for each."},{"@type":"BreadcrumbList","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/artificial-intelligence\/telecom-common-corpus\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Home","item":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/"},{"@type":"ListItem","position":2,"name":"Telecom Common Corpus"}]},{"@type":"WebSite","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#website","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/","name":"GSMA Foundry","description":"","publisher":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#organization"},"potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"en-US"},{"@type":"Organization","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#organization","name":"GSMA Foundry","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/","logo":{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#\/schema\/logo\/image\/","url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2024\/06\/GSMA-Logo-Red-RGB_square.jpg","contentUrl":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2024\/06\/GSMA-Logo-Red-RGB_square.jpg","width":600,"height":600,"caption":"GSMA Foundry"},"image":{"@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#\/schema\/logo\/image\/"},"sameAs":["https:\/\/x.com\/gsma"]},{"@type":"Person","@id":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/#\/schema\/person\/aa49e7aa16edc4611533b381c8021368","name":"nchouhan@gsma.com","image":{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/secure.gravatar.com\/avatar\/691236268a4d0e917797b23bcec96f8a1afaa607538adaa167d95195ff23ee73?s=96&d=mm&r=g","url":"https:\/\/secure.gravatar.com\/avatar\/691236268a4d0e917797b23bcec96f8a1afaa607538adaa167d95195ff23ee73?s=96&d=mm&r=g","contentUrl":"https:\/\/secure.gravatar.com\/avatar\/691236268a4d0e917797b23bcec96f8a1afaa607538adaa167d95195ff23ee73?s=96&d=mm&r=g","caption":"nchouhan@gsma.com"}}]}},"featured_image_url":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-content\/uploads\/2026\/07\/Telecom-Common-Corpus-616x616-1.png","_links":{"self":[{"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/posts\/15777","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/users\/32"}],"replies":[{"embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/comments?post=15777"}],"version-history":[{"count":1,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/posts\/15777\/revisions"}],"predecessor-version":[{"id":15778,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/posts\/15777\/revisions\/15778"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/media\/15779"}],"wp:attachment":[{"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/media?parent=15777"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/categories?post=15777"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/tags?post=15777"},{"taxonomy":"algolia_discover_type","embeddable":true,"href":"https:\/\/www.gsma.com\/get-involved\/gsma-foundry\/wp-json\/wp\/v2\/algolia_discover_type?post=15777"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}