Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions data/2025Q4/1-fetch/smithsonian_1_metrics.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
"CC0_RECORDS","CC0_RECORDS_WITH_CC0_MEDIA","CC0_MEDIA","CC0_MEDIA_PERCENTAGE","TOTAL_OBJECTS"
"14273329","5199915","4503016","36","15616799"
39 changes: 39 additions & 0 deletions data/2025Q4/1-fetch/smithsonian_2_units.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,39 @@
"UNIT","CC0_RECORDS","CC0_RECORDS_WITH_CC0_MEDIA","TOTAL_OBJECTS"
"AAA","0","0","29735"
"AAG","0","0","344"
"ACM","251","247","2977"
"ACMA","0","0","57"
"CFCHFOLKLIFE","17544","0","18517"
"CHNDM","58158","54590","201545"
"FBR","1517","37","11248"
"FSG","4720","4720","45588"
"HAC","430","430","1437"
"HMSG","449","448","13898"
"HSFA","0","0","299"
"NASM","1010","989","32325"
"NMAAHC","22224","4465","22577"
"NMAH","1316502","10548","1317248"
"NMAI","237637","180","239307"
"NMAfA","111","111","12477"
"NMNHANTHRO","497734","0","497734"
"NMNHBIRDS","635217","559038","635217"
"NMNHBOTANY","4562256","3572487","4562256"
"NMNHEDUCATION","6473","4090","6473"
"NMNHENTO","731838","197223","731838"
"NMNHFISHES","502585","10806","502585"
"NMNHHERPS","615308","2345","615308"
"NMNHINV","2003972","70094","2003972"
"NMNHMAMMALS","626133","542046","626133"
"NMNHMINSCI","465275","11311","465275"
"NMNHPALEO","743533","94487","743533"
"NPG","15446","14540","123566"
"NPM","10814","8005","83710"
"NZP","1061","1061","2086"
"OCIO_DPO3D","108","17","146"
"OFEO-SG","5509","3665","7295"
"SAAM","13626","12891","188157"
"SIA","35498","5477","48169"
"SIL","1035579","13567","1039087"
"SILAF","63416","0","63416"
"SILNMAHTL","34577","0","34577"
"SLA_SRO","104811","0","104811"
352 changes: 352 additions & 0 deletions data/2025Q4/1-fetch/wikipedia_count_by_languages.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,352 @@
"LANGUAGE_CODE","LANGUAGE_NAME_EN","LANGUAGE_NAME","COUNT"
"ab","Abkhazian","аԥсшәа","6478"
"ace","Acehnese","Acèh","13010"
"ady","Adyghe","адыгабзэ","617"
"af","Afrikaans","Afrikaans","127192"
"alt","Southern Altai","алтай тил","1102"
"am","Amharic","አማርኛ","15457"
"ami","Amis","Pangcah","1145"
"an","Aragonese","aragonés","50631"
"ang","Old English","Ænglisc","5023"
"ann","Obolo","Obolo","433"
"anp","Angika","अंगिका","1669"
"ar","Arabic","العربية","1287138"
"arc","Aramaic","ܐܪܡܝܐ","1915"
"ary","Moroccan Arabic","الدارجة","10914"
"arz","Egyptian Arabic","مصرى","1629627"
"as","Assamese","অসমীয়া","20329"
"ast","Asturian","asturianu","138140"
"atj","Atikamekw","Atikamekw","2076"
"av","Avaric","авар","4003"
"avk","Kotava","Kotava","29899"
"awa","Awadhi","अवधी","2541"
"ay","Aymara","Aymar aru","5246"
"az","Azerbaijani","azərbaycanca","209376"
"azb","South Azerbaijani","تۆرکجه","244390"
"ba","Bashkir","башҡортса","63914"
"ban","Balinese","Basa Bali","34260"
"bar","Bavarian","Boarisch","27201"
"bbc","Batak Toba","Batak Toba","1261"
"bcl","Central Bikol","Bikol Central","21213"
"bdr","West Coast Bajau","Bajau Sama","236"
"be","Belarusian","беларуская","257360"
"be-tarask","Belarusian (Taraškievica orthography)","беларуская (тарашкевіца)","89937"
"bew","Betawi","Betawi","3075"
"bg","Bulgarian","български","306660"
"bh","Bhojpuri","भोजपुरी","8857"
"bi","Bislama","Bislama","1478"
"bjn","Banjar","Banjar","11444"
"blk","Pa'O","ပအိုဝ်ႏဘာႏသာႏ","2907"
"bm","Bambara","bamanankan","922"
"bn","Bangla","বাংলা","177623"
"bo","Tibetan","བོད་ཡིག","7361"
"bpy","Bishnupriya","বিষ্ণুপ্রিয়া মণিপুরী","25092"
"br","Breton","brezhoneg","89866"
"bs","Bosnian","bosanski","96166"
"btm","Batak Mandailing","Batak Mandailing","1188"
"bug","Buginese","Basa Ugi","15955"
"bxr","Russia Buriat","буряад","2911"
"ca","Catalan","català","784500"
"cbk-zam","Chavacano","Chavacano de Zamboanga","3236"
"cdo","Mindong","閩東語 / Mìng-dĕ̤ng-ngṳ̄","16690"
"ce","Chechen","нохчийн","685499"
"ceb","Cebuano","Cebuano","6115864"
"ch","Chamorro","Chamoru","558"
"cho","Choctaw","Chahta anumpa","6"
"chr","Cherokee","ᏣᎳᎩ","999"
"chy","Cheyenne","Tsetsêhestâhese","724"
"ckb","Central Kurdish","کوردی","79276"
"co","Corsican","corsu","8621"
"cr","Cree","Nēhiyawēwin / ᓀᐦᐃᔭᐍᐏᐣ","14"
"crh","Crimean Tatar","qırımtatarca","29622"
"cs","Czech","čeština","580814"
"csb","Kashubian","kaszëbsczi","5498"
"cu","Church Slavic","словѣньскъ / ⰔⰎⰑⰂⰡⰐⰠⰔⰍⰟ","1312"
"cv","Chuvash","чӑвашла","58098"
"cy","Welsh","Cymraeg","283788"
"da","Danish","dansk","311557"
"dag","Dagbani","dagbanli","13337"
"de","German","Deutsch","3071559"
"dga","Southern Dagaare","Dagaare","2932"
"din","Dinka","Thuɔŋjäŋ","339"
"diq","Dimli","Zazaki","42344"
"dsb","Lower Sorbian","dolnoserbski","3425"
"dtp","Central Dusun","Kadazandusun","1714"
"dty","Doteli","डोटेली","3629"
"dv","Divehi","ދިވެހިބަސް","3192"
"dz","Dzongkha","ཇོང་ཁ","377"
"ee","Ewe","eʋegbe","1268"
"el","Greek","Ελληνικά","261141"
"eml","Emiliano-Romagnolo","emiliàn e rumagnòl","13724"
"en","English","English","7095068"
"eo","Esperanto","Esperanto","378174"
"es","Spanish","español","2075904"
"et","Estonian","eesti","255971"
"eu","Basque","euskara","475858"
"ext","Extremaduran","estremeñu","4070"
"fa","Persian","فارسی","1062741"
"fat","Fanti","mfantse","1764"
"ff","Fula","Fulfulde","12884"
"fi","Finnish","suomi","608129"
"fj","Fijian","Na Vosa Vakaviti","1612"
"fo","Faroese","føroyskt","14179"
"fon","Fon","fɔ̀ngbè","3331"
"fr","French","français","2721837"
"frp","Arpitan","arpetan","5814"
"frr","Northern Frisian","Nordfriisk","20688"
"fur","Friulian","furlan","4885"
"fy","Western Frisian","Frysk","58562"
"ga","Irish","Gaeilge","62646"
"gag","Gagauz","Gagauz","3013"
"gan","Gan","贛語","6814"
"gcr","Guianan Creole","kriyòl gwiyannen","1075"
"gd","Scottish Gaelic","Gàidhlig","16017"
"gl","Galician","galego","227840"
"glk","Gilaki","گیلکی","48352"
"gn","Guarani","Avañe'ẽ","5980"
"gom","Goan Konkani","गोंयची कोंकणी / Gõychi Konknni","3643"
"gor","Gorontalo","Bahasa Hulontalo","14906"
"got","Gothic","𐌲𐌿𐍄𐌹𐍃𐌺","978"
"gpe","Ghanaian Pidgin","Ghanaian Pidgin","4067"
"gsw","Alemannic","Alemannisch","31395"
"gu","Gujarati","ગુજરાતી","30723"
"guc","Wayuu","wayuunaiki","687"
"gur","Frafra","farefare","1329"
"guw","Gun","gungbe","1562"
"gv","Manx","Gaelg","7025"
"ha","Hausa","Hausa","72469"
"hak","Hakka Chinese","客家語 / Hak-kâ-ngî","10384"
"haw","Hawaiian","Hawaiʻi","2965"
"he","Hebrew","עברית","386358"
"hi","Hindi","हिन्दी","166788"
"hif","Fiji Hindi","Fiji Hindi","12067"
"ho","Hiri Motu","Hiri Motu","3"
"hr","Croatian","hrvatski","228501"
"hsb","Upper Sorbian","hornjoserbsce","14203"
"ht","Haitian Creole","Kreyòl ayisyen","71297"
"hu","Hungarian","magyar","563323"
"hy","Armenian","հայերեն","323208"
"hyw","Western Armenian","Արեւմտահայերէն","13241"
"ia","Interlingua","interlingua","30150"
"iba","Iban","Jaku Iban","1853"
"id","Indonesian","Bahasa Indonesia","755061"
"ie","Interlingue","Interlingue","13381"
"ig","Igbo","Igbo","44047"
"igl","Igala","Igala","945"
"ii","Sichuan Yi","ꆇꉙ","3"
"ik","Inupiaq","Iñupiatun","604"
"ilo","Iloko","Ilokano","15439"
"inh","Ingush","гӀалгӀай","2411"
"io","Ido","Ido","60127"
"is","Icelandic","íslenska","60834"
"it","Italian","italiano","1945506"
"iu","Inuktitut","ᐃᓄᒃᑎᑐᑦ / inuktitut","430"
"ja","Japanese","日本語","1481303"
"jam","Jamaican Creole English","Patois","1730"
"jbo","Lojban","la .lojban.","1348"
"jv","Javanese","Jawa","74712"
"ka","Georgian","ქართული","187582"
"kaa","Kara-Kalpak","Qaraqalpaqsha","10879"
"kab","Kabyle","Taqbaylit","7005"
"kbd","Kabardian","адыгэбзэ","1637"
"kbp","Kabiye","Kabɩyɛ","1715"
"kcg","Tyap","Tyap","1462"
"kg","Kongo","Kongo","1570"
"kge","Komering","Kumoring","2660"
"ki","Kikuyu","Gĩkũyũ","1907"
"kj","Kuanyama","Kwanyama","4"
"kk","Kazakh","қазақша","241129"
"kl","Kalaallisut","kalaallisut","245"
"km","Khmer","ភាសាខ្មែរ","11805"
"kn","Kannada","ಕನ್ನಡ","34058"
"knc","Central Kanuri","Yerwa Kanuri","1533"
"ko","Korean","한국어","730102"
"koi","Komi-Permyak","перем коми","3468"
"krc","Karachay-Balkar","къарачай-малкъар","2653"
"ks","Kashmiri","کٲشُر","8266"
"ksh","Colognian","Ripoarisch","3037"
"ku","Kurdish","kurdî","90922"
"kus","Kusaal","Kʋsaal","1224"
"kv","Komi","коми","5730"
"kw","Cornish","kernowek","7097"
"ky","Kyrgyz","кыргызча","76092"
"la","Latin","Latina","140740"
"lad","Ladino","Ladino","3883"
"lb","Luxembourgish","Lëtzebuergesch","66079"
"lbe","Lak","лакку","1250"
"lez","Lezghian","лезги","4452"
"lfn","Lingua Franca Nova","Lingua Franca Nova","4498"
"lg","Ganda","Luganda","4409"
"li","Limburgish","Limburgs","15145"
"lij","Ligurian","Ligure","11455"
"lld","Ladin","Ladin","180809"
"lmo","Lombard","lombard","79765"
"ln","Lingala","lingála","4839"
"lo","Lao","ລາວ","5227"
"lrc","Northern Luri","لۊری شومالی","1"
"lt","Lithuanian","lietuvių","224202"
"ltg","Latgalian","latgaļu","1112"
"lv","Latvian","latviešu","138753"
"lzh","Literary Chinese","文言","13879"
"mad","Madurese","Madhurâ","1993"
"mai","Maithili","मैथिली","14252"
"map-bms","Banyumasan","Basa Banyumasan","13942"
"mdf","Moksha","мокшень","7614"
"mg","Malagasy","Malagasy","101368"
"mh","Marshallese","Ebon","4"
"mhr","Eastern Mari","олык марий","11327"
"mi","Māori","Māori","8019"
"min","Minangkabau","Minangkabau","228700"
"mk","Macedonian","македонски","156541"
"ml","Malayalam","മലയാളം","87412"
"mn","Mongolian","монгол","26499"
"mni","Manipuri","ꯃꯤꯇꯩ ꯂꯣꯟ","10454"
"mnw","Mon","ဘာသာမန်","1963"
"mos","Mossi","moore","1306"
"mr","Marathi","मराठी","100775"
"mrj","Western Mari","кырык мары","10429"
"ms","Malay","Bahasa Melayu","434658"
"mt","Maltese","Malti","7656"
"mus","Muscogee","Mvskoke","1"
"mwl","Mirandese","Mirandés","4282"
"my","Burmese","မြန်မာဘာသာ","109824"
"myv","Erzya","эрзянь","7867"
"mzn","Mazanderani","مازِرونی","64346"
"nah","Nahuatl","Nāhuatl","4282"
"nan","Minnan","閩南語 / Bân-lâm-gí","433845"
"nap","Neapolitan","Napulitano","14937"
"nds","Low German","Plattdüütsch","85768"
"nds-nl","Low Saxon","Nedersaksies","8061"
"ne","Nepali","नेपाली","29323"
"new","Newari","नेपाल भाषा","72646"
"ng","Ndonga","Oshiwambo","8"
"nia","Nias","Li Niha","1765"
"nl","Dutch","Nederlands","2203326"
"nn","Norwegian Nynorsk","norsk nynorsk","176886"
"no","Norwegian","norsk","661503"
"nov","Novial","Novial","1881"
"nqo","N’Ko","ߒߞߏ","1580"
"nr","South Ndebele","isiNdebele seSewula","272"
"nrm","Norman","Nouormand","5055"
"nso","Northern Sotho","Sesotho sa Leboa","8783"
"nup","Nupe","Nupe","528"
"nv","Navajo","Diné bizaad","22664"
"ny","Nyanja","Chi-Chewa","1099"
"oc","Occitan","occitan","90398"
"olo","Livvi-Karelian","livvinkarjala","4636"
"om","Oromo","Oromoo","1960"
"or","Odia","ଓଡ଼ିଆ","20057"
"os","Ossetic","ирон","21371"
"pa","Punjabi","ਪੰਜਾਬੀ","58920"
"pag","Pangasinan","Pangasinan","2618"
"pam","Pampanga","Kapampangan","10138"
"pap","Papiamento","Papiamentu","4992"
"pcd","Picard","Picard","6034"
"pcm","Nigerian Pidgin","Naijá","1522"
"pdc","Pennsylvania German","Deitsch","2040"
"pfl","Palatine German","Pälzisch","2829"
"pi","Pali","पालि","290"
"pl","Polish","polski","1675671"
"pms","Piedmontese","Piemontèis","70675"
"pnb","Western Punjabi","پنجابی","74688"
"pnt","Pontic","Ποντιακά","489"
"ps","Pashto","پښتو","20828"
"pt","Portuguese","português","1160718"
"pwn","Paiwan","pinayuanan","376"
"qu","Quechua","Runa Simi","24279"
"rki","Arakanese","ရခိုင်","1076"
"rm","Romansh","rumantsch","3813"
"rmy","Vlax Romani","romani čhib","756"
"rn","Rundi","ikirundi","703"
"ro","Romanian","română","518408"
"roa-tara","Tarantino","tarandíne","9497"
"rsk","Pannonian Rusyn","руски","965"
"ru","Russian","русский","2072909"
"rue","Rusyn","русиньскый","10143"
"rup","Aromanian","armãneashti","1389"
"rw","Kinyarwanda","Ikinyarwanda","8877"
"sa","Sanskrit","संस्कृतम्","12412"
"sah","Yakut","саха тыла","17800"
"sat","Santali","ᱥᱟᱱᱛᱟᱲᱤ","13890"
"sc","Sardinian","sardu","7734"
"scn","Sicilian","sicilianu","26261"
"sco","Scots","Scots","34282"
"sd","Sindhi","سنڌي","19658"
"se","Northern Sami","davvisámegiella","7905"
"sg","Sango","Sängö","368"
"sgs","Samogitian","žemaitėška","17273"
"sh","Serbo-Croatian","srpskohrvatski / српскохрватски","461206"
"shi","Tachelhit","Taclḥit","10878"
"shn","Shan","တႆး","14328"
"si","Sinhala","සිංහල","24813"
"simple","Simple English","Simple English","276499"
"sk","Slovak","slovenčina","256745"
"skr","Saraiki","سرائیکی","24335"
"sl","Slovenian","slovenščina","195688"
"sm","Samoan","Gagana Samoa","1198"
"smn","Inari Sami","anarâškielâ","6491"
"sn","Shona","chiShona","11497"
"so","Somali","Soomaaliga","9099"
"sq","Albanian","shqip","104705"
"sr","Serbian","српски / srpski","713007"
"srn","Sranan Tongo","Sranantongo","1128"
"ss","Swati","SiSwati","1133"
"st","Southern Sotho","Sesotho","1546"
"stq","Saterland Frisian","Seeltersk","4129"
"su","Sundanese","Sunda","62154"
"sv","Swedish","svenska","2619580"
"sw","Swahili","Kiswahili","102737"
"syl","Sylheti","ꠍꠤꠟꠐꠤ","1195"
"szl","Silesian","ślůnski","59570"
"szy","Sakizaya","Sakizaya","2735"
"ta","Tamil","தமிழ்","178645"
"tay","Atayal","Tayal","2582"
"tcy","Tulu","ತುಳು","2874"
"tdd","Tai Nuea","ᥖᥭᥰ ᥖᥬᥲ ᥑᥨᥒᥰ","441"
"te","Telugu","తెలుగు","117091"
"tet","Tetum","tetun","1380"
"tg","Tajik","тоҷикӣ","116055"
"th","Thai","ไทย","177772"
"ti","Tigrinya","ትግርኛ","335"
"tig","Tigre","ትግሬ","41"
"tk","Turkmen","Türkmençe","7028"
"tl","Tagalog","Tagalog","48776"
"tly","Talysh","tolışi","10047"
"tn","Tswana","Setswana","3385"
"to","Tongan","lea faka-Tonga","2043"
"tpi","Tok Pisin","Tok Pisin","1407"
"tr","Turkish","Türkçe","653026"
"trv","Taroko","Seediq","1201"
"ts","Tsonga","Xitsonga","956"
"tt","Tatar","татарча / tatarça","560372"
"tum","Tumbuka","chiTumbuka","18796"
"tw","Twi","Twi","4624"
"ty","Tahitian","reo tahiti","1250"
"tyv","Tuvinian","тыва дыл","4042"
"udm","Udmurt","удмурт","5714"
"ug","Uyghur","ئۇيغۇرچە / Uyghurche","9614"
"uk","Ukrainian","українська","1397827"
"ur","Urdu","اردو","235319"
"uz","Uzbek","oʻzbekcha / ўзбекча","315519"
"ve","Venda","Tshivenda","822"
"vec","Venetian","vèneto","69525"
"vep","Veps","vepsän kel’","7076"
"vi","Vietnamese","Tiếng Việt","1296456"
"vls","West Flemish","West-Vlams","8217"
"vo","Volapük","Volapük","46139"
"vro","Võro","võro","6858"
"wa","Walloon","walon","12797"
"war","Waray","Winaray","1266823"
"wo","Wolof","Wolof","1743"
"wuu","Wu","吴语","46974"
"xal","Kalmyk","хальмг","1596"
"xh","Xhosa","isiXhosa","2318"
"xmf","Mingrelian","მარგალური","21934"
"yi","Yiddish","ייִדיש","15634"
"yo","Yoruba","Yorùbá","36320"
"yue","Cantonese","粵語","148076"
"za","Zhuang","Vahcuengh","3005"
"zea","Zeelandic","Zeêuws","7092"
"zgh","Standard Moroccan Tamazight","ⵜⴰⵎⴰⵣⵉⵖⵜ ⵜⴰⵏⴰⵡⴰⵢⵜ","11955"
"zh","Chinese","中文","1512195"
"zu","Zulu","isiZulu","11810"
Loading