Skip to content

Instantly share code, notes, and snippets.

@tavlima
Created February 14, 2013 20:38
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 1 You must be signed in to fork a gist
  • Save tavlima/4956195 to your computer and use it in GitHub Desktop.
Save tavlima/4956195 to your computer and use it in GitHub Desktop.
Languages and three letters code (ISO 639-2) Using only the bibliographic (B) codes From http://www.loc.gov/standards/iso639-2/php/code_list.php Last update: 2013-02-14
<?php
// From http://www.loc.gov/standards/iso639-2/php/code_list.php
// Last update: 2013-02-14
// Using only the bibliographic (B) codes
$languages = array(
'aar' => "Afar",
'abk' => "Abkhazian",
'ace' => "Achinese",
'ach' => "Acoli",
'ada' => "Adangme",
'ady' => "Adyghe; Adygei",
'afh' => "Afrihili",
'afr' => "Afrikaans",
'afa' => "Afro-Asiatic languages",
'ain' => "Ainu",
'aka' => "Akan",
'akk' => "Akkadian",
'alb' => "Albanian",
'ale' => "Aleut",
'alg' => "Algonquian languages",
'tut' => "Altaic languages",
'amh' => "Amharic",
'anp' => "Angika",
'apa' => "Apache languages",
'ara' => "Arabic",
'arg' => "Aragonese",
'arp' => "Arapaho",
'arw' => "Arawak",
'arm' => "Armenian",
'rup' => "Aromanian; Arumanian; Macedo-Romanian",
'art' => "Artificial languages",
'asm' => "Assamese",
'ast' => "Asturian; Bable; Leonese; Asturleonese",
'ath' => "Athapascan languages",
'aus' => "Australian languages",
'map' => "Austronesian languages",
'ava' => "Avaric",
'ave' => "Avestan",
'awa' => "Awadhi",
'aym' => "Aymara",
'aze' => "Azerbaijani",
'ban' => "Balinese",
'bat' => "Baltic languages",
'bal' => "Baluchi",
'bam' => "Bambara",
'bai' => "Bamileke languages",
'bad' => "Banda languages",
'bnt' => "Bantu languages",
'bas' => "Basa",
'bak' => "Bashkir",
'baq' => "Basque",
'btk' => "Batak languages",
'bej' => "Beja; Bedawiyet",
'bel' => "Belarusian",
'bem' => "Bemba",
'ben' => "Bengali",
'ber' => "Berber languages",
'bho' => "Bhojpuri",
'bih' => "Bihari languages",
'bik' => "Bikol",
'bin' => "Bini; Edo",
'bis' => "Bislama",
'byn' => "Blin; Bilin",
'zbl' => "Blissymbols; Blissymbolics; Bliss",
'nob' => "Bokmål, Norwegian; Norwegian Bokmål",
'bos' => "Bosnian",
'bra' => "Braj",
'bre' => "Breton",
'bug' => "Buginese",
'bul' => "Bulgarian",
'bua' => "Buriat",
'bur' => "Burmese",
'cad' => "Caddo",
'cat' => "Catalan; Valencian",
'cau' => "Caucasian languages",
'ceb' => "Cebuano",
'cel' => "Celtic languages",
'cai' => "Central American Indian languages",
'khm' => "Central Khmer",
'chg' => "Chagatai",
'cmc' => "Chamic languages",
'cha' => "Chamorro",
'che' => "Chechen",
'chr' => "Cherokee",
'chy' => "Cheyenne",
'chb' => "Chibcha",
'nya' => "Chichewa; Chewa; Nyanja",
'chi' => "Chinese",
'chn' => "Chinook jargon",
'chp' => "Chipewyan; Dene Suline",
'cho' => "Choctaw",
'chu' => "Church Slavic; Old Slavonic; Church Slavonic; Old Bulgarian; Old Church Slavonic",
'chk' => "Chuukese",
'chv' => "Chuvash",
'nwc' => "Classical Newari; Old Newari; Classical Nepal Bhasa",
'syc' => "Classical Syriac",
'cop' => "Coptic",
'cor' => "Cornish",
'cos' => "Corsican",
'cre' => "Cree",
'mus' => "Creek",
'crp' => "Creoles and pidgins",
'cpe' => "Creoles and pidgins, English based",
'cpf' => "Creoles and pidgins, French-based",
'cpp' => "Creoles and pidgins, Portuguese-based",
'crh' => "Crimean Tatar; Crimean Turkish",
'hrv' => "Croatian",
'cus' => "Cushitic languages",
'cze' => "Czech",
'dak' => "Dakota",
'dan' => "Danish",
'dar' => "Dargwa",
'del' => "Delaware",
'din' => "Dinka",
'div' => "Divehi; Dhivehi; Maldivian",
'doi' => "Dogri",
'dgr' => "Dogrib",
'dra' => "Dravidian languages",
'dua' => "Duala",
'dum' => "Dutch, Middle (ca.1050-1350)",
'dut' => "Dutch; Flemish",
'dyu' => "Dyula",
'dzo' => "Dzongkha",
'frs' => "Eastern Frisian",
'efi' => "Efik",
'egy' => "Egyptian (Ancient)",
'eka' => "Ekajuk",
'elx' => "Elamite",
'eng' => "English",
'enm' => "English, Middle (1100-1500)",
'ang' => "English, Old (ca.450-1100)",
'myv' => "Erzya",
'epo' => "Esperanto",
'est' => "Estonian",
'ewe' => "Ewe",
'ewo' => "Ewondo",
'fan' => "Fang",
'fat' => "Fanti",
'fao' => "Faroese",
'fij' => "Fijian",
'fil' => "Filipino; Pilipino",
'fin' => "Finnish",
'fiu' => "Finno-Ugrian languages",
'fon' => "Fon",
'fre' => "French",
'frm' => "French, Middle (ca.1400-1600)",
'fro' => "French, Old (842-ca.1400)",
'fur' => "Friulian",
'ful' => "Fulah",
'gaa' => "Ga",
'gla' => "Gaelic; Scottish Gaelic",
'car' => "Galibi Carib",
'glg' => "Galician",
'lug' => "Ganda",
'gay' => "Gayo",
'gba' => "Gbaya",
'gez' => "Geez",
'geo' => "Georgian",
'ger' => "German",
'gmh' => "German, Middle High (ca.1050-1500)",
'goh' => "German, Old High (ca.750-1050)",
'gem' => "Germanic languages",
'gil' => "Gilbertese",
'gon' => "Gondi",
'gor' => "Gorontalo",
'got' => "Gothic",
'grb' => "Grebo",
'grc' => "Greek, Ancient (to 1453)",
'gre' => "Greek, Modern (1453-)",
'grn' => "Guarani",
'guj' => "Gujarati",
'gwi' => "Gwich'in",
'hai' => "Haida",
'hat' => "Haitian; Haitian Creole",
'hau' => "Hausa",
'haw' => "Hawaiian",
'heb' => "Hebrew",
'her' => "Herero",
'hil' => "Hiligaynon",
'him' => "Himachali languages; Western Pahari languages",
'hin' => "Hindi",
'hmo' => "Hiri Motu",
'hit' => "Hittite",
'hmn' => "Hmong; Mong",
'hun' => "Hungarian",
'hup' => "Hupa",
'iba' => "Iban",
'ice' => "Icelandic",
'ido' => "Ido",
'ibo' => "Igbo",
'ijo' => "Ijo languages",
'ilo' => "Iloko",
'smn' => "Inari Sami",
'inc' => "Indic languages",
'ine' => "Indo-European languages",
'ind' => "Indonesian",
'inh' => "Ingush",
'ina' => "Interlingua (International Auxiliary Language Association)",
'ile' => "Interlingue; Occidental",
'iku' => "Inuktitut",
'ipk' => "Inupiaq",
'ira' => "Iranian languages",
'gle' => "Irish",
'mga' => "Irish, Middle (900-1200)",
'sga' => "Irish, Old (to 900)",
'iro' => "Iroquoian languages",
'ita' => "Italian",
'jpn' => "Japanese",
'jav' => "Javanese",
'jrb' => "Judeo-Arabic",
'jpr' => "Judeo-Persian",
'kbd' => "Kabardian",
'kab' => "Kabyle",
'kac' => "Kachin; Jingpho",
'kal' => "Kalaallisut; Greenlandic",
'xal' => "Kalmyk; Oirat",
'kam' => "Kamba",
'kan' => "Kannada",
'kau' => "Kanuri",
'kaa' => "Kara-Kalpak",
'krc' => "Karachay-Balkar",
'krl' => "Karelian",
'kar' => "Karen languages",
'kas' => "Kashmiri",
'csb' => "Kashubian",
'kaw' => "Kawi",
'kaz' => "Kazakh",
'kha' => "Khasi",
'khi' => "Khoisan languages",
'kho' => "Khotanese; Sakan",
'kik' => "Kikuyu; Gikuyu",
'kmb' => "Kimbundu",
'kin' => "Kinyarwanda",
'kir' => "Kirghiz; Kyrgyz",
'tlh' => "Klingon; tlhIngan-Hol",
'kom' => "Komi",
'kon' => "Kongo",
'kok' => "Konkani",
'kor' => "Korean",
'kos' => "Kosraean",
'kpe' => "Kpelle",
'kro' => "Kru languages",
'kua' => "Kuanyama; Kwanyama",
'kum' => "Kumyk",
'kur' => "Kurdish",
'kru' => "Kurukh",
'kut' => "Kutenai",
'lad' => "Ladino",
'lah' => "Lahnda",
'lam' => "Lamba",
'day' => "Land Dayak languages",
'lao' => "Lao",
'lat' => "Latin",
'lav' => "Latvian",
'lez' => "Lezghian",
'lim' => "Limburgan; Limburger; Limburgish",
'lin' => "Lingala",
'lit' => "Lithuanian",
'jbo' => "Lojban",
'nds' => "Low German; Low Saxon; German, Low; Saxon, Low",
'dsb' => "Lower Sorbian",
'loz' => "Lozi",
'lub' => "Luba-Katanga",
'lua' => "Luba-Lulua",
'lui' => "Luiseno",
'smj' => "Lule Sami",
'lun' => "Lunda",
'luo' => "Luo (Kenya and Tanzania)",
'lus' => "Lushai",
'ltz' => "Luxembourgish; Letzeburgesch",
'mac' => "Macedonian",
'mad' => "Madurese",
'mag' => "Magahi",
'mai' => "Maithili",
'mak' => "Makasar",
'mlg' => "Malagasy",
'may' => "Malay",
'mal' => "Malayalam",
'mlt' => "Maltese",
'mnc' => "Manchu",
'mdr' => "Mandar",
'man' => "Mandingo",
'mni' => "Manipuri",
'mno' => "Manobo languages",
'glv' => "Manx",
'mao' => "Maori",
'arn' => "Mapudungun; Mapuche",
'mar' => "Marathi",
'chm' => "Mari",
'mah' => "Marshallese",
'mwr' => "Marwari",
'mas' => "Masai",
'myn' => "Mayan languages",
'men' => "Mende",
'mic' => "Mi'kmaq; Micmac",
'min' => "Minangkabau",
'mwl' => "Mirandese",
'moh' => "Mohawk",
'mdf' => "Moksha",
'mkh' => "Mon-Khmer languages",
'lol' => "Mongo",
'mon' => "Mongolian",
'mos' => "Mossi",
'mul' => "Multiple languages",
'mun' => "Munda languages",
'nqo' => "N'Ko",
'nah' => "Nahuatl languages",
'nau' => "Nauru",
'nav' => "Navajo; Navaho",
'nde' => "Ndebele, North; North Ndebele",
'nbl' => "Ndebele, South; South Ndebele",
'ndo' => "Ndonga",
'nap' => "Neapolitan",
'new' => "Nepal Bhasa; Newari",
'nep' => "Nepali",
'nia' => "Nias",
'nic' => "Niger-Kordofanian languages",
'ssa' => "Nilo-Saharan languages",
'niu' => "Niuean",
'zxx' => "No linguistic content; Not applicable",
'nog' => "Nogai",
'non' => "Norse, Old",
'nai' => "North American Indian languages",
'frr' => "Northern Frisian",
'sme' => "Northern Sami",
'nor' => "Norwegian",
'nno' => "Norwegian Nynorsk; Nynorsk, Norwegian",
'nub' => "Nubian languages",
'nym' => "Nyamwezi",
'nyn' => "Nyankole",
'nyo' => "Nyoro",
'nzi' => "Nzima",
'oci' => "Occitan (post 1500)",
'arc' => "Official Aramaic (700-300 BCE); Imperial Aramaic (700-300 BCE)",
'oji' => "Ojibwa",
'ori' => "Oriya",
'orm' => "Oromo",
'osa' => "Osage",
'oss' => "Ossetian; Ossetic",
'oto' => "Otomian languages",
'pal' => "Pahlavi",
'pau' => "Palauan",
'pli' => "Pali",
'pam' => "Pampanga; Kapampangan",
'pag' => "Pangasinan",
'pan' => "Panjabi; Punjabi",
'pap' => "Papiamento",
'paa' => "Papuan languages",
'nso' => "Pedi; Sepedi; Northern Sotho",
'per' => "Persian",
'peo' => "Persian, Old (ca.600-400 B.C.)",
'phi' => "Philippine languages",
'phn' => "Phoenician",
'pon' => "Pohnpeian",
'pol' => "Polish",
'por' => "Portuguese",
'pra' => "Prakrit languages",
'pro' => "Provençal, Old (to 1500);Occitan, Old (to 1500)",
'pus' => "Pushto; Pashto",
'que' => "Quechua",
'raj' => "Rajasthani",
'rap' => "Rapanui",
'rar' => "Rarotongan; Cook Islands Maori",
'qaa-qtz' => "Reserved for local use",
'roa' => "Romance languages",
'rum' => "Romanian; Moldavian; Moldovan",
'roh' => "Romansh",
'rom' => "Romany",
'run' => "Rundi",
'rus' => "Russian",
'sal' => "Salishan languages",
'sam' => "Samaritan Aramaic",
'smi' => "Sami languages",
'smo' => "Samoan",
'sad' => "Sandawe",
'sag' => "Sango",
'san' => "Sanskrit",
'sat' => "Santali",
'srd' => "Sardinian",
'sas' => "Sasak",
'sco' => "Scots",
'sel' => "Selkup",
'sem' => "Semitic languages",
'srp' => "Serbian",
'srr' => "Serer",
'shn' => "Shan",
'sna' => "Shona",
'iii' => "Sichuan Yi; Nuosu",
'scn' => "Sicilian",
'sid' => "Sidamo",
'sgn' => "Sign Languages",
'bla' => "Siksika",
'snd' => "Sindhi",
'sin' => "Sinhala; Sinhalese",
'sit' => "Sino-Tibetan languages",
'sio' => "Siouan languages",
'sms' => "Skolt Sami",
'den' => "Slave (Athapascan)",
'sla' => "Slavic languages",
'slo' => "Slovak",
'slv' => "Slovenian",
'sog' => "Sogdian",
'som' => "Somali",
'son' => "Songhai languages",
'snk' => "Soninke",
'wen' => "Sorbian languages",
'sot' => "Sotho, Southern",
'sai' => "South American Indian languages",
'alt' => "Southern Altai",
'sma' => "Southern Sami",
'spa' => "Spanish; Castilian",
'srn' => "Sranan Tongo",
'zgh' => "Standard Moroccan Tamazight",
'suk' => "Sukuma",
'sux' => "Sumerian",
'sun' => "Sundanese",
'sus' => "Susu",
'swa' => "Swahili",
'ssw' => "Swati",
'swe' => "Swedish",
'gsw' => "Swiss German; Alemannic; Alsatian",
'syr' => "Syriac",
'tgl' => "Tagalog",
'tah' => "Tahitian",
'tai' => "Tai languages",
'tgk' => "Tajik",
'tmh' => "Tamashek",
'tam' => "Tamil",
'tat' => "Tatar",
'tel' => "Telugu",
'ter' => "Tereno",
'tet' => "Tetum",
'tha' => "Thai",
'tib' => "Tibetan",
'tig' => "Tigre",
'tir' => "Tigrinya",
'tem' => "Timne",
'tiv' => "Tiv",
'tli' => "Tlingit",
'tpi' => "Tok Pisin",
'tkl' => "Tokelau",
'tog' => "Tonga (Nyasa)",
'ton' => "Tonga (Tonga Islands)",
'tsi' => "Tsimshian",
'tso' => "Tsonga",
'tsn' => "Tswana",
'tum' => "Tumbuka",
'tup' => "Tupi languages",
'tur' => "Turkish",
'ota' => "Turkish, Ottoman (1500-1928)",
'tuk' => "Turkmen",
'tvl' => "Tuvalu",
'tyv' => "Tuvinian",
'twi' => "Twi",
'udm' => "Udmurt",
'uga' => "Ugaritic",
'uig' => "Uighur; Uyghur",
'ukr' => "Ukrainian",
'umb' => "Umbundu",
'mis' => "Uncoded languages",
'und' => "Undetermined",
'hsb' => "Upper Sorbian",
'urd' => "Urdu",
'uzb' => "Uzbek",
'vai' => "Vai",
'ven' => "Venda",
'vie' => "Vietnamese",
'vol' => "Volapük",
'vot' => "Votic",
'wak' => "Wakashan languages",
'wln' => "Walloon",
'war' => "Waray",
'was' => "Washo",
'wel' => "Welsh",
'fry' => "Western Frisian",
'wal' => "Wolaitta; Wolaytta",
'wol' => "Wolof",
'xho' => "Xhosa",
'sah' => "Yakut",
'yao' => "Yao",
'yap' => "Yapese",
'yid' => "Yiddish",
'yor' => "Yoruba",
'ypk' => "Yupik languages",
'znd' => "Zande languages",
'zap' => "Zapotec",
'zza' => "Zaza; Dimili; Dimli; Kirdki; Kirmanjki; Zazaki",
'zen' => "Zenaga",
'zha' => "Zhuang; Chuang",
'zul' => "Zulu",
'zun' => "Zuni",
);
?>
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment