-
Notifications
You must be signed in to change notification settings - Fork 1
/
wikis.json
2567 lines (2567 loc) · 88.4 KB
/
wikis.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
[
[
"English",
"English language",
"[[:en:|en]]",
4234378,
129657,
763,
"English is a West Germanic language that was first spoken in early medieval England and is now the most widely used language in the world."
],
[
"German",
"German language",
"de",
1585992,
20931,
89,
"German (Deutsch [\u02c8d\u0254\u028ft\u0283]\u00a0( listen)) is a West Germanic language related to and classified alongside English and Dutch."
],
[
"Dutch",
"Dutch language",
"nl",
1568516,
4646,
10,
"Dutch (\u00a0Nederlands\u00a0(help\u00b7info)) is a West Germanic language and the native language of most of the population of the Netherlands, and about sixty percent of the populations of Belgium and Suriname, the three member states of the Dutch Language Union."
],
[
"French",
"French language",
"fr",
1386998,
17773,
162,
"French (le fran\u00e7ais [l\u0259 f\u0281\u0251\u0303s\u025b]\u00a0( listen) or la langue fran\u00e7aise [la l\u0251\u0303\u0261 f\u0281\u0251\u0303s\u025bz]) is a Romance language spoken as a first language in France, the Romandy region in Switzerland, Wallonia and Brussels in Belgium, Monaco, the provinces of Quebec and New Brunswick (Acadia region) in Canada, and parts of the United States."
],
[
"Italian",
"Italian language",
"it",
1033404,
7922,
94,
"Italian (\u00a0italiano\u00a0(help\u00b7info) or lingua italiana) is a Romance language spoken mainly in Europe: Italy, Switzerland, San Marino, Vatican City, by minorities in Malta, Monaco, Croatia, Slovenia, France, Libya, Eritrea, and Somalia, and by expatriate communities in the Americas and Australia."
],
[
"Spanish",
"Spanish language",
"es",
1016704,
16590,
168,
"Spanish (espa\u00f1ol), also called Castilian (castellano \u00a0listen\u00a0(help\u00b7info)), is a Romance language that originated in Castile, a region in Spain."
],
[
"Russian",
"Russian language",
"ru",
1002601,
11844,
106,
"Russian (\u0440\u0443\u0301\u0441\u0441\u043a\u0438\u0439 \u044f\u0437\u044b\u0301\u043a, russkij jazyk, pronounced [\u02c8rusk\u02b2\u026aj j\u026a\u02c8z\u0268k]) is a Slavic language spoken primarily in Russia, Belarus, Ukraine, Kazakhstan, and Kyrgyzstan."
],
[
"Swedish",
"Swedish language",
"sv",
974213,
2928,
21,
"Swedish (\u00a0svenska\u00a0(help\u00b7info)) is a North Germanic language, spoken by approximately 10 million people, predominantly in Sweden and parts of Finland, where it has equal legal standing with Finnish."
],
[
"Polish",
"Polish language",
"pl",
967547,
4757,
18,
"Polish (j\u0119zyk polski, polszczyzna) is a language of the Lechitic subgroup of West Slavic languages, used throughout Poland (being that country's official language) and by Polish minorities in other countries."
],
[
"Japanese",
"Japanese language",
"ja",
858311,
12001,
63,
"Japanese (\u65e5\u672c\u8a9e, Nihongo?, [nih\u00f5\u014bgo], [nih\u00f5\u014b\u014bo] \u00a0( listen)) is an East Asian language spoken by about 125 million speakers, primarily in Japan, where it is the national language."
],
[
"Portuguese",
"Portuguese language",
"pt",
781814,
5695,
110,
"Portuguese (\u00a0portugu\u00eas\u00a0(help\u00b7info) or l\u00edngua portuguesa [\u02c8\u026b\u0129gw\u0250 pu\u027etu\u02c8\u0263ez\u0250]) is a Romance language."
],
[
"Chinese",
"Chinese language",
"zh",
694714,
7496,
99,
"Chinese (\u6c49\u8bed/\u6f22\u8a9e H\u00e0ny\u01d4 or \u4e2d\u6587 Zh\u014dngw\u00e9n) is a group of related language varieties, several of which are not mutually intelligible, and is variously described as a language or language family."
],
[
"Vietnamese",
"Vietnamese language",
"vi",
579406,
1118,
23,
"Vietnamese (ti\u1ebfng Vi\u1ec7t) is the national, official language of Vietnam."
],
[
"Ukrainian",
"Ukrainian language",
"uk",
442808,
2058,
40,
"Ukrainian (\u0443\u043a\u0440\u0430\u0457\u0301\u043d\u0441\u044c\u043a\u0430 \u043c\u043e\u0301\u0432\u0430 ukrayins'ka mova, pronounced\u00a0[ukr\u0251\u02c8j\u026a\u0272s\u02b2k\u0251 \u02c8m\u0254w\u0251]) is a member of the East Slavic subgroup of the Slavic languages."
],
[
"Catalan",
"Catalan language",
"ca",
402715,
1500,
26,
"Catalan /\u02c8k\u00e6t\u0259l\u00e6n/ (autonym: catal\u00e0 [k\u0259t\u0259\u02c8\u026ba] or [kata\u02c8\u026ba]) is a Romance language named for its origins in the historical region of Catalonia in the northeastern part of Spain and adjoining parts of what is now France."
],
[
"Norwegian (Bokm\u00e5l)",
"Norwegian (Bokm\u00e5l) language",
"no",
380196,
1836,
28,
"Bokm\u00e5l ([\u02c8bu\u02d0km\u0254\u02d0l], lit. \"book tongue\") is one of two official written standards for the Norwegian language, the other being Nynorsk."
],
[
"Waray-Waray",
"Waray-Waray language",
"war",
377380,
62,
3,
"Waray-Waray (also Waray, Samar-Leyte, and Samarnon) is a language spoken in the provinces of Samar, Northern Samar, Eastern Samar, Biliran, and in the north-east of Leyte Island (surrounding Tacloban) in the Philippines."
],
[
"Cebuano",
"Cebuano language",
"ceb",
359336,
64,
4,
"Cebuano, referred to by most of its speakers as Binisaya (or Visayan in English), is an Austronesian language spoken in the Philippines by about 20 million people, mostly in the Central Visayas, most of whom belong to the Bisaya ethnic group."
],
[
"Finnish",
"Finnish language",
"fi",
322637,
1765,
46,
"Finnish (\u00a0suomi\u00a0(help\u00b7info), or suomen kieli) is the language spoken by the majority of the population in Finland and by ethnic Finns outside Finland."
],
[
"Persian",
"Persian language",
"fa",
307792,
2396,
157,
"Persian (Persian: \u0641\u0627\u0631\u0633\u06cc F\u0101rsi [f\u0252\u02d0\u027e\u02c8si\u02d0]) is an Iranian language within the Indo-Iranian branch of the Indo-European languages."
],
[
"Czech",
"Czech language",
"cs",
265545,
2033,
39,
"Czech (pron.: /\u02c8t\u0283\u025bk/; \u010de\u0161tina Czech pronunciation:\u00a0[\u02c8t\u0361\u0283\u025b\u0283c\u026ana]) is a West Slavic language with about 12 million native speakers; it is the majority language in the Czech Republic and spoken by Czechs worldwide."
],
[
"Hungarian",
"Hungarian language",
"hu",
240342,
1925,
100,
"Hungarian (Hungarian: magyar nyelv \u00a0listen\u00a0(help\u00b7info)) is a member of the Finno-Ugric group of the Uralic languages."
],
[
"Korean",
"Korean language",
"ko",
239090,
1930,
81,
"Korean (Korean: \ud55c\uad6d\uc5b4/\uc870\uc120\ub9d0, see below) is the official language of South Korea and North Korea as well as one of the two official languages in China's Yanbian Korean Autonomous Prefecture."
],
[
"Arabic",
"Arabic language",
"ar",
229755,
3061,
237,
"Arabic (\u0627\u0644\u0639\u0631\u0628\u064a\u0629 al-\u02bbarab\u012byah [al\u0295ara\u02c8bijja]\u00a0( listen) or \u0639\u0631\u0628\u064a/\u0639\u0631\u0628\u0649 \u02bbarab\u012b\u00a0 [\u02c8\u0295arabi\u02d0]\u00a0( listen)) is a name applied to the descendants of the Classical Arabic language of the 6th century AD."
],
[
"Romanian",
"Romanian language",
"ro",
225824,
1063,
87,
"Romanian (or Daco-Romanian; obsolete spellings Rumanian, Roumanian; self-designation: rom\u00e2n\u0103, limba rom\u00e2n\u0103 [\u02c8limba ro\u02c8m\u0268n\u0259]\u00a0( listen) (\"the Romanian language\") or rom\u00e2ne\u0219te (lit. \"in Romanian\")) is a Romance language spoken by around 24 million people as a native language, primarily in Romania and Moldova, and by another 4 million people as a second language."
],
[
"Malay",
"Malay language",
"ms",
218599,
346,
18,
"Malay (pron.: /m\u0259\u02c8le\u026a/; Bahasa Melayu; Jawi script: \u0628\u0647\u0627\u0633 \u0645\u0644\u0627\u064a\u0648 ) is a major language of the Austronesian family."
],
[
"Turkish",
"Turkish language",
"tr",
209621,
2697,
216,
"Turkish (\u00a0T\u00fcrk\u00e7e\u00a0(help\u00b7info)), also referred to as Istanbul Turkish or Anatolian Turkish, is the most widely-spoken of the Turkic languages, with over 63 million native speakers."
],
[
"Indonesian",
"Indonesian language",
"id",
208967,
1740,
108,
"Indonesian (Bahasa Indonesia) is the official language of Indonesia."
],
[
"Kazakh",
"Kazakh language",
"kk",
202431,
331,
7,
"Kazakh (also Qazaq, Qazaq\u015fa and variants, natively \u049a\u0430\u0437\u0430\u049b \u0442\u0456\u043b\u0456, Qazaq tili, \u0642\u0627\u0632\u0627\u0642 \u0674\u062a\u0649\u0644\u0649\u200e; pronounced [q\u0251\u02c8z\u0251q t\u0258\u02c8l\u0258]) is a Turkic language which belongs to the Kipchak (or Western Turkic) branch of the Turkic languages, closely related to Nogai and Karakalpak."
],
[
"Serbian",
"Serbian language",
"sr",
187802,
738,
63,
"Serbian (Serbian Cyrillic: \u0441\u0440\u043f\u0441\u043a\u0438, Latin: srpski, pronounced\u00a0[sr\u0329\u0302pski\u02d0]) is a standardized register of the Serbo-Croatian language used by Serbs, mainly in Serbia, Bosnia and Herzegovina (mostly Republika Srpska), Montenegro, Croatia, and Macedonia."
],
[
"Slovak",
"Slovak language",
"sk",
183804,
571,
18,
"Slovak (\u00a0slovensk\u00fd jazyk\u00a0(help\u00b7info), sloven\u010dina, not to be confused with slovenski jezik or sloven\u0161\u010dina, the native name of the Slovene language), is an Indo-European language that belongs to the West Slavic languages (together with Czech, Polish, Silesian, Kashubian, and Sorbian)."
],
[
"Esperanto",
"Esperanto language",
"eo",
180243,
409,
18,
"\u00a0Esperanto\u00a0(help\u00b7info) is the most widely spoken constructed international auxiliary language."
],
[
"Danish",
"Danish language",
"da",
178310,
1079,
66,
"Danish (dansk, pronounced\u00a0[d\u0325an\u02c0s\u0261\u030a]\u00a0( listen); dansk sprog, [\u02c8d\u0325an\u02c0s\u0261\u030a \u02c8sb\u0325\u0281\u0254\u028a\u032f\u02c0]) is a North Germanic language spoken by around six million people, principally in the country of Denmark and in the region of Southern Schleswig in northern Germany, where it holds minority language status."
],
[
"Lithuanian",
"Lithuanian language",
"lt",
158599,
376,
18,
"Lithuanian (lietuvi\u0173 kalba) is the official state language of Lithuania and is recognized as one of the official languages of the European Union."
],
[
"Basque",
"Basque language",
"eu",
150918,
306,
21,
"Basque (endonym: Euskara, IPA:\u00a0[eus\u033a\u02c8ka\u027ea]) is the ancestral language of the Basque people, who inhabit the Basque Country, a region spanning an area in northeastern Spain and southwestern France."
],
[
"Bulgarian",
"Bulgarian language",
"bg",
147501,
756,
29,
"Bulgarian (\u0431\u044a\u043b\u0433\u0430\u0440\u0441\u043a\u0438 \u0435\u0437\u0438\u043a, pronounced\u00a0[\u02c8b\u0264\u031e\u026b\u0261\u0250rski \u025b\u02c8zik]) is an Indo-European language, a member of the Southern branch of the Slavic language family."
],
[
"Hebrew",
"Hebrew language",
"he",
146423,
2297,
248,
"Hebrew /\u02c8hi\u02d0bru\u02d0/ (\u05e2\u05b4\u05d1\u05b0\u05e8\u05b4\u05d9\u05ea \u02bfIvrit [\u0294iv\u02c8\u0281it]\u00a0( listen) or [\u0295iv\u02c8\u027eit]\u00a0( listen)) is a West Semitic language of the Afroasiatic language family."
],
[
"Croatian",
"Croatian language",
"hr",
137483,
512,
36,
"Croatian (hrvatski jezik) is a standardized register of the Serbo-Croatian language used by Croats, principally in Croatia, Bosnia and Herzegovina, the Serbian province of Vojvodina and other neighbouring countries."
],
[
"Slovenian",
"Slovenian language",
"sl",
137136,
530,
20,
"Slovene or Slovenian (slovenski jezik or sloven\u0161\u010dina, not to be confused with sloven\u010dina, the native name of Slovak) belongs to the group of South Slavic languages."
],
[
"Uzbek",
"Uzbek language",
"uz",
122125,
84,
41,
"Uzbek (o\u02bbzbek tili or o\u02bbzbekcha in Latin script; \u045e\u0437\u0431\u0435\u043a \u0442\u0438\u043b\u0438 or \u045e\u0437\u0431\u0435\u043a\u0447\u0430 in Cyrillic script; \u0627\u0648\u0632\u0628\u06cc\u06a9 \u062a\u06cc\u0644\u06cc or \u0627\u0648\u0632\u0628\u06cc\u06a9\u0686\u0647 in Arabic script) is a Turkic language and the official language of Uzbekistan."
],
[
"Volap\u00fck",
"Volap\u00fck language",
"vo",
119097,
34,
15,
"Volap\u00fck (/\u02c8v\u0252l\u0259p\u028ak/; [vola\u02c8pyk]) is a constructed language, created in 1879\u20131880 by Johann Martin Schleyer, a Roman Catholic priest in Baden, Germany."
],
[
"Estonian",
"Estonian language",
"et",
111246,
486,
31,
"Estonian (eesti keel\u00a0 pronounced\u00a0[\u02c8e\u02d0sti \u02c8ke\u02d0l]\u00a0( listen)) is the official language of Estonia, spoken natively by about 1.1 million people in Estonia and tens of thousands in various migrant communities."
],
[
"Hindi",
"Hindi language",
"hi",
105403,
210,
45,
"Hindi, or more precisely Modern Standard Hindi, is a standardised and sanskritised register of the Hindustani language (Hindi-Urdu) that is associated with the Hindu religion."
],
[
"Norwegian (Nynorsk)",
"Norwegian (Nynorsk) language",
"nn",
102885,
232,
20,
"Nynorsk, Neo Norwegian or New Norwegian is one of two official written standards for the Norwegian language, the other being Bokm\u00e5l."
],
[
"Galician",
"Galician language",
"gl",
102175,
286,
19,
"Galician /\u0261\u0259\u02c8l\u026a\u0283\u0259n/ or /\u0261\u0259\u02c8l\u026asi.\u0259n/ (galego IPA:\u00a0[\u0261a\u02c8le\u0263o]) is a language of the Western Ibero-Romance branch."
],
[
"Simple English",
"Simple English language",
"simple",
98950,
732,
76,
null
],
[
"Azerbaijani",
"Azerbaijani language",
"az",
94642,
381,
27,
"Azerbaijani or Azeri (Az\u0259rbaycanca, Az\u0259rbaycan dili) is a language belonging to the Turkic language family, spoken in southwestern Asia by the Azerbaijani people, primarily in the Republic of Azerbaijan (8 million speakers), in northwestern Iran (10 to 12 million speakers) and in the Republic of Georgia, Russia, Turkey and in other countries with a presence of Azerbaijani speakers (6 million speakers)."
],
[
"Latin",
"Latin language",
"la",
90473,
236,
12,
"Latin (/\u02c8l\u00e6t\u0268n/; Latin: lingua lat\u012bna; IPA:\u00a0[\u02c8l\u026a\u014b\u0261\u02b7a la\u02c8ti\u02d0na]) is an ancient Italic language originally spoken by the Italic Latins in Latium and Ancient Rome."
],
[
"Greek",
"Greek language",
"el",
87530,
732,
48,
"Greek (\u03b5\u03bb\u03bb\u03b7\u03bd\u03b9\u03ba\u03ac [elini\u02c8ka] ellinik\u00e1 or \u03b5\u03bb\u03bb\u03b7\u03bd\u03b9\u03ba\u03ae \u03b3\u03bb\u03ce\u03c3\u03c3\u03b1 [elini\u02c8ci \u02c8\u0263losa] ellinik\u00ed gl\u00f3ssa) is an independent branch of the Indo-European family of languages."
],
[
"Serbo-Croatian",
"Serbo-Croatian language",
"sh",
81258,
216,
20,
"Serbo-Croatian, or Serbo-Croat, less commonly Bosnian/Croatian/Serbian (BCS), is a South Slavic language and the primary language of Serbia, Croatia, Bosnia and Herzegovina, Montenegro."
],
[
"Thai",
"Thai language",
"th",
81081,
1012,
208,
"Thai, or more precisely Siamese or Central Thai, is the national and official language of Thailand and the native language of the Thai people, Thailand's dominant ethnic group."
],
[
"Georgian",
"Georgian language",
"ka",
75756,
201,
38,
"Georgian (\u10e5\u10d0\u10e0\u10d7\u10e3\u10da\u10d8 \u10d4\u10dc\u10d0, pronounced\u00a0[k\u02b0art\u02b0uli \u025bna]) is the native language of the Georgians and the official language of Georgia, a country in the Caucasus."
],
[
"Macedonian",
"Macedonian language",
"mk",
72106,
515,
0,
"Macedonian (\u043c\u0430\u043a\u0435\u0434\u043e\u043d\u0441\u043a\u0438 \u0458\u0430\u0437\u0438\u043a, makedonski jazik, pronounced\u00a0[ma\u02c8k\u025bd\u0254nski \u02c8jazik]\u00a0( listen)) is a South Slavic language, spoken as a first language by some two million people, principally in the Republic of Macedonia and the Macedonian diaspora, with a smaller number of speakers throughout the transnational region of Macedonia."
],
[
"Occitan",
"Occitan language",
"oc",
71969,
109,
8,
"Occitan (English pronunciation: /\u02c8\u0252ks\u026a\u02cct\u00e6n/; French:\u00a0[\u0254k.si't\u0251\u0303]; Occitan:\u00a0[utsi\u02c8ta]), known also as Lenga d'\u00f2c by its native speakers (Occitan:\u00a0[\u02c8le\u014b\u0261\u0254 \u02c8\u00f0\u0254(k)]; French: Langue d'oc), is a Romance language spoken in southern France, Italy's Occitan Valleys, Monaco, and Catalonia's Val d'Aran: the regions sometimes known unofficially as Occitania."
],
[
"Newar / Nepal Bhasa",
"Newar / Nepal Bhasa language",
"new",
70069,
29,
12,
"Nepal Bhasa (\u0928\u0947\u092a\u093e\u0932 \u092d\u093e\u0937\u093e, N\u0113p\u0101l bh\u0101\u1e63\u0101, also known as New\u0101h Bh\u0101y) is one of the major languages of Nepal."
],
[
"Piedmontese",
"Piedmontese language",
"pms",
61486,
37,
2,
"Piedmontese (Italian: Piemontese, Piedmontese: Piemont\u00e8is) is a Romance language spoken by over 1 million people in Piedmont, northwest Italy."
],
[
"Tagalog",
"Tagalog language",
"tl",
61433,
113,
33,
"Tagalog /t\u0259\u02c8\u0261\u0251\u02d0l\u0252\u0261/ (Tagalog:\u00a0[t\u0250\u02c8\u0261a\u02d0lo\u0261]) is an Austronesian language spoken as a first language by a quarter of the population of the Philippines and as a second language by most of the rest."
],
[
"Belarusian",
"Belarusian language",
"be",
59512,
227,
22,
"The Belarusian language (\u0431\u0435\u043b\u0430\u0440\u0443\u0441\u043a\u0430\u044f \u043c\u043e\u0432\u0430, BGN/PCGN: byelaruskaya mova, Scientific: bielaruskaja mova, \u0142ac.: bie\u0142aruskaja mova), sometimes referred to as White Ruthenian, is the language of the Belarusian people."
],
[
"Tamil",
"Tamil language",
"ta",
53429,
253,
32,
"Tamil /\u02c8t\u00e6m\u026al/ (\u0ba4\u0bae\u0bbf\u0bb4\u0bcd, tami\u1e3b,\u00a0[t\u032a\u0250m\u0268\u027b]\u00a0?) is a Dravidian language spoken predominantly by Tamil people of South India and North-east Sri Lanka."
],
[
"Haitian",
"Haitian language",
"ht",
53204,
30,
0,
"Haitian Creole (Krey\u00f2l ayisyen; pronounced:\u00a0[k\u0263ej\u0254l ajisj\u025b\u0303] French: Cr\u00e9ole ha\u00eftien), often called simply Creole or Krey\u00f2l, is a language spoken by about twelve million people,[citation needed] which includes virtually the entire population of Haiti and via emigration, by about two to three million speakers residing in the Bahamas, Belize, Canada, Cayman Islands, Cuba, Dominican Republic, France, French Guiana, Guadeloupe, Ivory Coast, Martinique, Puerto Rico, Trinidad and Tobago, the United States, and Venezuela."
],
[
"Telugu",
"Telugu language",
"te",
52081,
110,
13,
"Telugu /\u02c8t\u025bl\u028a\u0261u\u02d0/ (\u0c24\u0c46\u0c32\u0c41\u0c17\u0c41 telugu, IPA:\u00a0[t\u032ael\u032au\u0261u]) is a Dravidian language predominantly spoken in the South Indian state of Andhra Pradesh where it is an official language."
],
[
"Belarusian (Tara\u0161kievica)",
"Belarusian (Tara\u0161kievica) language",
"be-x-old",
49061,
159,
32,
"Tara\u0161kievica or Belarusian Classical Orthography ([tara\u0282\u02c8k\u02b2\u025bv\u02b2it\u0361sa]; Belarusian: \u0442\u0430\u0440\u0430\u0448\u043a\u0435\u0432\u0456\u0446\u0430, \u043a\u043b\u044f\u0441\u044b\u0447\u043d\u044b \u043f\u0440\u0430\u0432\u0430\u043f\u0456\u0441) is a variant of the orthography of the Belarusian language, based on the literary norm of the modern Belarusian language, the first normalization of which was made by Branis\u0142a\u016d Tara\u0161kievi\u010d in 1918, and was in official use in Belarus until the Belarusian orthography reform of 1933."
],
[
"Welsh",
"Welsh language",
"cy",
48791,
100,
28,
"Welsh (Cymraeg or y Gymraeg, pronounced [k\u0259m\u02c8r\u0251\u02d0\u0268\u0261, \u0259 \u0261\u0259m\u02c8r\u0251\u02d0\u0268\u0261]) is a member of the Brythonic branch of the Celtic languages spoken natively in Wales, by some along the Welsh border in England, and in Y Wladfa (the Welsh colony in Chubut Province, Argentina)."
],
[
"Latvian",
"Latvian language",
"lv",
48506,
269,
100,
"Latvian (latvie\u0161u valoda) is the official state language of Latvia."
],
[
"Bosnian",
"Bosnian language",
"bs",
45940,
180,
149,
"Bosnian (bosanski / \u0431\u043e\u0441\u0430\u043d\u0441\u043a\u0438 [b\u0254\u030csanski\u02d0]) is a standardized register of the Serbo-Croatian language, a South Slavic language, used by Bosniaks."
],
[
"Albanian",
"Albanian language",
"sq",
45630,
218,
27,
"Albanian (gjuha shqipe [\u02c8\u025fuha \u02c8\u0283cip\u025b] or shqip [\u0283cip]) is an Indo-European language spoken by approximately 7.4 million people all over the world, primarily in Albania and Kosovo but also in other areas of the Balkans in which there is an Albanian population, including western Republic of Macedonia, southern Montenegro, Greece and Italy."
],
[
"Breton",
"Breton language",
"br",
45630,
105,
20,
"Breton /\u02c8br\u025bt\u0259n/ (Brezhoneg) is a Celtic language spoken in Brittany (Breton: Breizh; French: Bretagne), France."
],
[
"Armenian",
"Armenian language",
"hy",
45444,
199,
83,
"The Armenian language (Armenian: \u0570\u0561\u0575\u0565\u0580\u0565\u0576, Armenian pronunciation:\u00a0[h\u0251j\u025b\u02c8\u027e\u025bn], hayeren) is an Indo-European language spoken by the Armenians."
],
[
"Malagasy",
"Malagasy language",
"mg",
45362,
29,
32,
"Malagasy /m\u00e6l\u0259\u02c8\u0261\u00e6si/ (Malagasy:\u00a0[\u02ccmala\u02c8\u0261as\u02b2]) is an Austronesian language and the national language of Madagascar."
],
[
"Tatar",
"Tatar language",
"tt",
43885,
66,
10,
"Tatar or Kazan Tatar (\u0442\u0430\u0442\u0430\u0440 \u0442\u0435\u043b\u0435, \u0442\u0430\u0442\u0430\u0440\u0447\u0430, tatar tele, tatar\u00e7a, \u062a\u0627\u062a\u0627\u0631 \u062a\u064a\u0644\u06cc) is a Turkic language spoken by the Tatars of the historical Kazan Khanate, including modern Tatarstan and Bashkortostan."
],
[
"Javanese",
"Javanese language",
"jv",
43783,
84,
13,
"Javanese /d\u0292\u0251\u02d0v\u0259\u02c8ni\u02d0z/ (Javanese: \ua9a7\ua9b1\ua997\ua9ae basa Jawa; Indonesian: bahasa Jawa) is the language of the Javanese people from the central and eastern parts of the island of Java, in Indonesia."
],
[
"Marathi",
"Marathi language",
"mr",
38740,
121,
53,
"Marathi /m\u0259\u02c8r\u0251\u02d0ti/ (\u092e\u0930\u093e\u0920\u0940 Mar\u0101\u1e6dh\u012b [m\u0259\u02c8\u027ea\u0288\u02b0i]) is an Indo-Aryan language."
],
[
"Luxembourgish",
"Luxembourgish language",
"lb",
38672,
86,
22,
"Luxembourgish (L\u00ebtzebuergesch) is a High German language that is spoken mainly in Luxembourg."
],
[
"Icelandic",
"Icelandic language",
"is",
35768,
158,
43,
"Icelandic (\u00a0\u00edslenska\u00a0(help\u00b7info)) is a North Germanic language, the main language of Iceland."
],
[
"Burmese",
"Burmese language",
"my",
31309,
49,
1,
"The Burmese language (Burmese: \u1019\u103c\u1014\u103a\u1019\u102c\u1018\u102c\u101e\u102c; pronounced:\u00a0[mj\u0259m\u00e0 b\u00e0\u00f0\u00e0]; MLCTS: myanma bhasa) is the official language of Burma."
],
[
"Yoruba",
"Yoruba language",
"yo",
30584,
35,
5,
"Yoruba /\u02c8j\u0252r\u028ab\u0259/ (natively \u00e8d\u00e8 Yor\u00f9b\u00e1) is a Niger\u2013Congo language spoken in West Africa."
],
[
"Bashkir",
"Bashkir language",
"ba",
30544,
58,
8,
"The Bashkir language (\u0411\u0430\u0448\u04a1\u043e\u0440\u0442 \u0442\u0435\u043b\u0435 ba\u015fqort tele, pronounced [ba\u0282.\u02ccq\u028a\u031ert.t\u026a\u031e.\u02c8l\u026a\u031e]\u00a0( listen)) is a Turkic language, and is the language of the Bashkirs."
],
[
"Malayalam",
"Malayalam language",
"ml",
30541,
293,
296,
"Malayalam /m\u00e6l\u0259\u02c8j\u0251\u02d0l\u0259m/ (\u0d2e\u0d32\u0d2f\u0d3e\u0d33\u0d02, malay\u0101\u1e37am\u00a0?, Malayalam pronunciation:\u00a0\u200b[m\u0250l\u0259ja\u02d0\u026d\u0259m]), is a language spoken in India, predominantly in the state of Kerala."
],
[
"Aragonese",
"Aragonese language",
"an",
29172,
87,
85,
"Aragonese (pron.: /\u02cc\u00e6r\u0259\u0261\u0252\u02c8ni\u02d0z/; aragon\u00e9s [a\u027ea\u0263o\u02c8nes] in Aragonese) is a Romance language spoken by between 10,000 and 30,000 people throughout the valleys of the Pyrenees in Aragon, Spain, mainly in the comarcas of Somontano de Barbastro, Jacetania, Alto G\u00e1llego, Sobrarbe, and Ribagorza."
],
[
"Lombard",
"Lombard language",
"lmo",
28669,
59,
32,
"Lombard is a member of the Cisalpine or Gallo-Italic group within the Romance languages."
],
[
"Afrikaans",
"Afrikaans language",
"af",
26806,
150,
38,
"Afrikaans /\u00e6fr\u026a\u02c8k\u0251\u02d0ns/ is a West Germanic language, spoken natively in South Africa, Namibia and to a lesser extent in Botswana and Zimbabwe."
],
[
"West Frisian",
"West Frisian language",
"fy",
26497,
77,
14,
"West Frisian (Frysk, Dutch: Westerlauwers Fries [\u02c8\u028b\u025bst\u0259r\u02ccl\u028cu\u032f\u0259rs \u02c8fris]) is a language spoken mostly in the province of Friesland (Frysl\u00e2n) in the north of the Netherlands."
],
[
"Western Panjabi",
"Western Panjabi language",
"pnb",
26352,
38,
0,
"Punjabi /p\u028cn\u02c8d\u0292\u0251\u02d0bi/ (Gurmukhi: \u0a2a\u0a70\u0a1c\u0a3e\u0a2c\u0a40, Shahmukhi: \u067e\u0646\u062c\u0627\u0628\u06cc, Devanagari: \u092a\u0902\u091c\u093e\u092c\u0940) is an Indo-Aryan language spoken by inhabitants of the historical Punjab region (India and Pakistan)."
],
[
"Bengali",
"Bengali language",
"bn",
26041,
288,
0,
"Bengali /b\u025b\u014b\u02c8\u0261\u0254\u02d0li/ (\u09ac\u09be\u0982\u09b2\u09be Bangla [\u02c8ba\u014bla]\u00a0( listen)) is an eastern Indo-Aryan language."
],
[
"Swahili",
"Swahili language",
"sw",
25272,
62,
37,
"The Swahili language (Arabic: \u0633\u0648\u0627\u062d\u0644\u064a\u200e), or Kiswahili, is a Bantu language and it is the mother tongue of the Swahili People (Waswahili) spoken in East and Central Africa by various ethnic groups that inhabit several large stretches of the Mozambique Channel coastline from northern Kenya to northern Mozambique."
],
[
"Bishnupriya Manipuri",
"Bishnupriya Manipuri language",
"bpy",
24800,
24,
23,
"The Bishnupriya or Bishnupriya Manipuri (BPM) (\u09ac\u09bf\u09b7\u09cd\u09a3\u09c1\u09aa\u09cd\u09b0\u09bf\u09af\u09bc\u09be \u09ae\u09a3\u09bf\u09aa\u09c1\u09b0\u09c0) is an Indo-Aryan language spoken in parts of the Indian states of Assam, Tripura and others, as well as in Sylhet region of Bangladesh, Burma, and other countries."
],
[
"Ido",
"Ido language",
"io",
24777,
51,
5,
"Ido (pron.: /\u02c8i\u02d0do\u028a/) is a language created to be a universal second language for speakers of diverse backgrounds."
],
[
"Kirghiz",
"Kirghiz language",
"ky",
24460,
54,
1,
"Kyrgyz /\u02c8k\u026a\u0259r\u0261\u026az/ (Kirgiz), also Kirghiz /k\u026a\u0259r\u02c8\u0261i\u02d0z/ (\u041a\u044b\u0440\u0433\u044b\u0437\u0447\u0430 or \u041a\u044b\u0440\u0433\u044b\u0437 \u0442\u0438\u043b\u0438, \u0642\u0649\u0631\u0639\u0649\u0632 \u062a\u0649\u0644\u0649, K\u0131rg\u0131z\u00e7a or K\u0131rg\u0131z tili) is a language of the Turkic language family and one of the main official languages of Kyrgyzstan, the other one being Russian."
],
[
"Urdu",
"Urdu language",
"ur",
24060,
78,
77,
"Urdu pron.: /\u02c8\u028a\u0259rdu\u02d0/ (Urdu: \u0627\u064f\u0631\u062f\u064f\u0648\u200e, Urd\u016b, Urdu pronunciation:\u00a0[\u02c8\u028ard\u032au]\u00a0( listen)), or more precisely Modern Standard Urdu, is a standardized register of the Hindustani language that is associated with the Muslim religion."
],
[
"Nepali",
"Nepali language",
"ne",
23290,
75,
10,
"Nepali (\u0928\u0947\u092a\u093e\u0932\u0940) is an Indo-Aryan language."
],
[
"Sicilian",
"Sicilian language",
"scn",
22970,
61,
22,
"Sicilian (lu sicilianu, Italian: lingua siciliana, also known as Siculu or Calabro-Sicilian) is a Romance language."
],
[
"Cantonese",
"Cantonese language",
"zh-yue",
22849,
164,
54,
"Cantonese, or Standard Cantonese (simplified Chinese: \u5e7f\u5dde\u8bdd; traditional Chinese: \u5ee3\u5dde\u8a71), is a language that originated in the vicinity of Canton (i.e., Guangzhou) in southern China, and is often regarded as the prestige dialect of Yue."
],
[
"Gujarati",
"Gujarati language",
"gu",
22530,
72,
5,
"Gujarati /\u0261\u028ad\u0292\u0259\u02c8r\u0251\u02d0ti/ (\u0a97\u0ac1\u0a9c\u0ab0\u0abe\u0aa4\u0ac0 Gujar\u0101t\u012b) is an Indo-Aryan language, native to Gujarat, Daman and Diu and Dadra and Nagar Haveli in India."
],
[
"Low Saxon",
"Low Saxon language",
"nds",
20511,
61,
31,
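"Low German or Low Saxon (Plattd\u00fc\u00fctsch, Nedderd\u00fc\u00fctsch; Standard German: Plattdeutsch or Niederdeutsch; Dutch: Nedersaksisch in the wider sense) is a West Germanic language spoken mainly in northern Germany and the eastern part of the Netherlands."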
],
[
"Irish",
"Irish language",
"ga",
19677,
55,
17,
"Irish (Gaeilge), also known as Irish Gaelic or Gaelic, is a Goidelic language of the Indo-European language family, originating in Ireland and historically spoken by the Irish people."
],
[
"Kurdish",
"Kurdish language",
"ku",
19627,
63,
25,
"Kurdish (Kurdish: Kurd\u00ee or \u06a9\u0648\u0631\u062f\u06cc) is a dialect continuum spoken by the Kurds in western Asia."
],
[
"Asturian",
"Asturian language",
"ast",
18668,
76,
15,
"Asturian (pron.: /\u00e6s\u02c8t\u028a\u0259ri\u0259n/; autonym: asturianu [astu'\u027ejanu], or bable [\u02c8ba\u03b2le]) is a Romance language of the West Iberian group, Astur-Leonese subgroup, spoken in Asturias (Spain)."
],
[
"Quechua",
"Quechua language",
"qu",
18122,
35,
37,
"Quechua (endonym \"Runa Simi\") is a Native South American language family spoken primarily in the Andes of South America, derived from a common ancestral language."
],
[
"Sundanese",
"Sundanese language",
"su",
17484,
41,
14,
"Sundanese /s\u028cnd\u0259\u02c8ni\u02d0z/ (Basa Sunda, in Sundanese script \u1b98\u1b9e \u1b9e\u1ba5\u1b94\u1baa\u1b93, literally \"language of Sunda\") is the language of about 39 million people from the western third of Java or about 15% of the Indonesian population."
],
[
"Chuvash",
"Chuvash language",
"cv",
15566,
46,
18,
"Chuvash (\u0427\u04d1\u0432\u0430\u0448\u043b\u0430, \u010c\u0103va\u0161la; IPA:\u00a0[t\u0255\u0259\u028ba\u0282\u02c8la]) is a Turkic language spoken in central Russia, primarily in the Chuvash Republic and adjacent areas."
],
[
"Scots",
"Scots language",
"sco",
14482,
68,
42,
"Scots is the Germanic language variety spoken in Lowland Scotland and parts of Ulster (where the local dialect is known as Ulster Scots)."
],
[
"Alemannic",
"Alemannic language",
"als",
14417,
94,
29,
"Alemannic (German: \u00a0Alemannisch\u00a0(help\u00b7info)) is a group of dialects of the Upper German branch of the Germanic language family."
],
[
"Interlingua",
"Interlingua language",
"ia",
13978,
52,
11,
"Interlingua (pron.: /\u026ant\u0259r\u02c8l\u026a\u014b\u0261w\u0259/; ISO 639 language codes ia, ina) is an international auxiliary language (IAL), developed between 1937 and 1951 by the International Auxiliary Language Association (IALA)."
],
[
"Neapolitan",
"Neapolitan language",
"nap",
13826,
35,
22,
"Neapolitan (autonym: nnapulitano; Italian: napoletano), also known as Southern Italian and Neapolitan\u2013Calabrian, is the language of southern continental Italy, including the city of Naples."
],
[
"Buginese",
"Buginese language",
"bug",
13819,
17,
1,
"Buginese (Basa Ugi, elsewhere also Bahasa Bugis, Bugis, Bugi, De) is the language spoken by about four million people mainly in the southern part of Sulawesi, Indonesia."
],
[
"Samogitian",
"Samogitian language",
"bat-smg",
13456,
26,
8,
"Samogitian (Samogitian: \u017demaitiu ruoda, Lithuanian: \u017demai\u010di\u0173 tarm\u0117) is a dialect of the Lithuanian language spoken mostly in Samogitia (in the western part of Lithuania)."
],
[
"Kannada",
"Kannada language",
"kn",
13034,
131,
27,
"Kannada /\u02c8k\u00e6n\u0259d\u0259/, (\u0c95\u0ca8\u0ccd\u0ca8\u0ca1 kanna\u1e0da, IPA:\u00a0[\u02c8k\u028cn\u02d0\u0259\u0256\u0251\u02d0]) or Kanarese /k\u00e6n\u0259\u02c8ri\u02d0z/, is a language spoken in India predominantly in the state of Karnataka."
],
[
"Banyumasan",
"Banyumasan language",
"map-bms",
12993,
23,
7,
"The Banyumasan language, colloquially known as Basa Ngapak, spoken on the island of Java, is usually considered a dialect of Javanese in modern language classification."
],
[
"Walloon",
"Walloon language",
"wa",
12803,
27,
23,
"Walloon (Walon in Walloon) is a Romance language that was spoken as a primary language in large portions (70%) of the Walloon Region of Belgium, in some villages of Northern France (near Givet) and in the northeast part of Wisconsin until the middle of the 20th century."
],
[
"Amharic",
"Amharic language",
"am",
12445,
31,
35,
"Amharic /\u00e6m\u02c8h\u00e6r\u026ak/ or /\u0251\u02d0m\u02c8h\u0251r\u026ak/ (Amharic: \u12a0\u121b\u122d\u129b?, Amar\u0259\u00f1\u00f1a, IPA:\u00a0[amar\u0268\u0272\u02d0a]\u00a0( listen)) is a Semitic language spoken in Ethiopia."
],
[
"Sorani",
"Sorani language",
"ckb",
12160,
66,
27,
"Soran\u00ee (\u06a9\u0648\u0631\u062f\u06cc\u06cc \u0646\u0627\u0648\u06d5\u0646\u062f\u06cc, \u0633\u06c6\u0631\u0627\u0646\u06cc; also called Central Kurdish) is a Kurdish dialect spoken in Iran and Iraq."
],