Skip to content

Instantly share code, notes, and snippets.

@tavlima
Created February 14, 2013 20:38
Show Gist options
  • Save tavlima/4956195 to your computer and use it in GitHub Desktop.
Save tavlima/4956195 to your computer and use it in GitHub Desktop.

Revisions

  1. tavlima created this gist Feb 14, 2013.
    495 changes: 495 additions & 0 deletions languages-iso-639-2.php
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,495 @@
    <?php

    // ISO 639-2 language code table.
    //
    // From http://www.loc.gov/standards/iso639-2/php/code_list.php
    // Last update: 2013-02-14
    // Using only the bibliographic (B) codes
    //
    // $languages maps each ISO 639-2 code (array key) to its English name
    // (array value). Notes for maintainers and callers:
    //   - Entries are listed in order of their English name, not of their code.
    //   - When an entry carries several English names they are joined with "; "
    //     (e.g. 'spa' => "Spanish; Castilian"), so explode('; ', $name) yields
    //     the individual names. Keep that exact separator when adding entries.
    //   - 'qaa-qtz' is a code *range* (reserved for local use), not a single
    //     three-letter code; a lookup of e.g. 'qab' will not find it.
    //   - The closing PHP tag is intentionally omitted so that including this
    //     file can never emit stray trailing whitespace.

    $languages = array(
    'aar' => "Afar",
    'abk' => "Abkhazian",
    'ace' => "Achinese",
    'ach' => "Acoli",
    'ada' => "Adangme",
    'ady' => "Adyghe; Adygei",
    'afh' => "Afrihili",
    'afr' => "Afrikaans",
    'afa' => "Afro-Asiatic languages",
    'ain' => "Ainu",
    'aka' => "Akan",
    'akk' => "Akkadian",
    'alb' => "Albanian",
    'ale' => "Aleut",
    'alg' => "Algonquian languages",
    'tut' => "Altaic languages",
    'amh' => "Amharic",
    'anp' => "Angika",
    'apa' => "Apache languages",
    'ara' => "Arabic",
    'arg' => "Aragonese",
    'arp' => "Arapaho",
    'arw' => "Arawak",
    'arm' => "Armenian",
    'rup' => "Aromanian; Arumanian; Macedo-Romanian",
    'art' => "Artificial languages",
    'asm' => "Assamese",
    'ast' => "Asturian; Bable; Leonese; Asturleonese",
    'ath' => "Athapascan languages",
    'aus' => "Australian languages",
    'map' => "Austronesian languages",
    'ava' => "Avaric",
    'ave' => "Avestan",
    'awa' => "Awadhi",
    'aym' => "Aymara",
    'aze' => "Azerbaijani",
    'ban' => "Balinese",
    'bat' => "Baltic languages",
    'bal' => "Baluchi",
    'bam' => "Bambara",
    'bai' => "Bamileke languages",
    'bad' => "Banda languages",
    'bnt' => "Bantu languages",
    'bas' => "Basa",
    'bak' => "Bashkir",
    'baq' => "Basque",
    'btk' => "Batak languages",
    'bej' => "Beja; Bedawiyet",
    'bel' => "Belarusian",
    'bem' => "Bemba",
    'ben' => "Bengali",
    'ber' => "Berber languages",
    'bho' => "Bhojpuri",
    'bih' => "Bihari languages",
    'bik' => "Bikol",
    'bin' => "Bini; Edo",
    'bis' => "Bislama",
    'byn' => "Blin; Bilin",
    'zbl' => "Blissymbols; Blissymbolics; Bliss",
    'nob' => "Bokmål, Norwegian; Norwegian Bokmål",
    'bos' => "Bosnian",
    'bra' => "Braj",
    'bre' => "Breton",
    'bug' => "Buginese",
    'bul' => "Bulgarian",
    'bua' => "Buriat",
    'bur' => "Burmese",
    'cad' => "Caddo",
    'cat' => "Catalan; Valencian",
    'cau' => "Caucasian languages",
    'ceb' => "Cebuano",
    'cel' => "Celtic languages",
    'cai' => "Central American Indian languages",
    'khm' => "Central Khmer",
    'chg' => "Chagatai",
    'cmc' => "Chamic languages",
    'cha' => "Chamorro",
    'che' => "Chechen",
    'chr' => "Cherokee",
    'chy' => "Cheyenne",
    'chb' => "Chibcha",
    'nya' => "Chichewa; Chewa; Nyanja",
    'chi' => "Chinese",
    'chn' => "Chinook jargon",
    'chp' => "Chipewyan; Dene Suline",
    'cho' => "Choctaw",
    'chu' => "Church Slavic; Old Slavonic; Church Slavonic; Old Bulgarian; Old Church Slavonic",
    'chk' => "Chuukese",
    'chv' => "Chuvash",
    'nwc' => "Classical Newari; Old Newari; Classical Nepal Bhasa",
    'syc' => "Classical Syriac",
    'cop' => "Coptic",
    'cor' => "Cornish",
    'cos' => "Corsican",
    'cre' => "Cree",
    'mus' => "Creek",
    'crp' => "Creoles and pidgins",
    'cpe' => "Creoles and pidgins, English based",
    'cpf' => "Creoles and pidgins, French-based",
    'cpp' => "Creoles and pidgins, Portuguese-based",
    'crh' => "Crimean Tatar; Crimean Turkish",
    'hrv' => "Croatian",
    'cus' => "Cushitic languages",
    'cze' => "Czech",
    'dak' => "Dakota",
    'dan' => "Danish",
    'dar' => "Dargwa",
    'del' => "Delaware",
    'din' => "Dinka",
    'div' => "Divehi; Dhivehi; Maldivian",
    'doi' => "Dogri",
    'dgr' => "Dogrib",
    'dra' => "Dravidian languages",
    'dua' => "Duala",
    'dum' => "Dutch, Middle (ca.1050-1350)",
    'dut' => "Dutch; Flemish",
    'dyu' => "Dyula",
    'dzo' => "Dzongkha",
    'frs' => "Eastern Frisian",
    'efi' => "Efik",
    'egy' => "Egyptian (Ancient)",
    'eka' => "Ekajuk",
    'elx' => "Elamite",
    'eng' => "English",
    'enm' => "English, Middle (1100-1500)",
    'ang' => "English, Old (ca.450-1100)",
    'myv' => "Erzya",
    'epo' => "Esperanto",
    'est' => "Estonian",
    'ewe' => "Ewe",
    'ewo' => "Ewondo",
    'fan' => "Fang",
    'fat' => "Fanti",
    'fao' => "Faroese",
    'fij' => "Fijian",
    'fil' => "Filipino; Pilipino",
    'fin' => "Finnish",
    'fiu' => "Finno-Ugrian languages",
    'fon' => "Fon",
    'fre' => "French",
    'frm' => "French, Middle (ca.1400-1600)",
    'fro' => "French, Old (842-ca.1400)",
    'fur' => "Friulian",
    'ful' => "Fulah",
    'gaa' => "Ga",
    'gla' => "Gaelic; Scottish Gaelic",
    'car' => "Galibi Carib",
    'glg' => "Galician",
    'lug' => "Ganda",
    'gay' => "Gayo",
    'gba' => "Gbaya",
    'gez' => "Geez",
    'geo' => "Georgian",
    'ger' => "German",
    'gmh' => "German, Middle High (ca.1050-1500)",
    'goh' => "German, Old High (ca.750-1050)",
    'gem' => "Germanic languages",
    'gil' => "Gilbertese",
    'gon' => "Gondi",
    'gor' => "Gorontalo",
    'got' => "Gothic",
    'grb' => "Grebo",
    'grc' => "Greek, Ancient (to 1453)",
    'gre' => "Greek, Modern (1453-)",
    'grn' => "Guarani",
    'guj' => "Gujarati",
    'gwi' => "Gwich'in",
    'hai' => "Haida",
    'hat' => "Haitian; Haitian Creole",
    'hau' => "Hausa",
    'haw' => "Hawaiian",
    'heb' => "Hebrew",
    'her' => "Herero",
    'hil' => "Hiligaynon",
    'him' => "Himachali languages; Western Pahari languages",
    'hin' => "Hindi",
    'hmo' => "Hiri Motu",
    'hit' => "Hittite",
    'hmn' => "Hmong; Mong",
    'hun' => "Hungarian",
    'hup' => "Hupa",
    'iba' => "Iban",
    'ice' => "Icelandic",
    'ido' => "Ido",
    'ibo' => "Igbo",
    'ijo' => "Ijo languages",
    'ilo' => "Iloko",
    'smn' => "Inari Sami",
    'inc' => "Indic languages",
    'ine' => "Indo-European languages",
    'ind' => "Indonesian",
    'inh' => "Ingush",
    'ina' => "Interlingua (International Auxiliary Language Association)",
    'ile' => "Interlingue; Occidental",
    'iku' => "Inuktitut",
    'ipk' => "Inupiaq",
    'ira' => "Iranian languages",
    'gle' => "Irish",
    'mga' => "Irish, Middle (900-1200)",
    'sga' => "Irish, Old (to 900)",
    'iro' => "Iroquoian languages",
    'ita' => "Italian",
    'jpn' => "Japanese",
    'jav' => "Javanese",
    'jrb' => "Judeo-Arabic",
    'jpr' => "Judeo-Persian",
    'kbd' => "Kabardian",
    'kab' => "Kabyle",
    'kac' => "Kachin; Jingpho",
    'kal' => "Kalaallisut; Greenlandic",
    'xal' => "Kalmyk; Oirat",
    'kam' => "Kamba",
    'kan' => "Kannada",
    'kau' => "Kanuri",
    'kaa' => "Kara-Kalpak",
    'krc' => "Karachay-Balkar",
    'krl' => "Karelian",
    'kar' => "Karen languages",
    'kas' => "Kashmiri",
    'csb' => "Kashubian",
    'kaw' => "Kawi",
    'kaz' => "Kazakh",
    'kha' => "Khasi",
    'khi' => "Khoisan languages",
    'kho' => "Khotanese; Sakan",
    'kik' => "Kikuyu; Gikuyu",
    'kmb' => "Kimbundu",
    'kin' => "Kinyarwanda",
    'kir' => "Kirghiz; Kyrgyz",
    'tlh' => "Klingon; tlhIngan-Hol",
    'kom' => "Komi",
    'kon' => "Kongo",
    'kok' => "Konkani",
    'kor' => "Korean",
    'kos' => "Kosraean",
    'kpe' => "Kpelle",
    'kro' => "Kru languages",
    'kua' => "Kuanyama; Kwanyama",
    'kum' => "Kumyk",
    'kur' => "Kurdish",
    'kru' => "Kurukh",
    'kut' => "Kutenai",
    'lad' => "Ladino",
    'lah' => "Lahnda",
    'lam' => "Lamba",
    'day' => "Land Dayak languages",
    'lao' => "Lao",
    'lat' => "Latin",
    'lav' => "Latvian",
    'lez' => "Lezghian",
    'lim' => "Limburgan; Limburger; Limburgish",
    'lin' => "Lingala",
    'lit' => "Lithuanian",
    'jbo' => "Lojban",
    'nds' => "Low German; Low Saxon; German, Low; Saxon, Low",
    'dsb' => "Lower Sorbian",
    'loz' => "Lozi",
    'lub' => "Luba-Katanga",
    'lua' => "Luba-Lulua",
    'lui' => "Luiseno",
    'smj' => "Lule Sami",
    'lun' => "Lunda",
    'luo' => "Luo (Kenya and Tanzania)",
    'lus' => "Lushai",
    'ltz' => "Luxembourgish; Letzeburgesch",
    'mac' => "Macedonian",
    'mad' => "Madurese",
    'mag' => "Magahi",
    'mai' => "Maithili",
    'mak' => "Makasar",
    'mlg' => "Malagasy",
    'may' => "Malay",
    'mal' => "Malayalam",
    'mlt' => "Maltese",
    'mnc' => "Manchu",
    'mdr' => "Mandar",
    'man' => "Mandingo",
    'mni' => "Manipuri",
    'mno' => "Manobo languages",
    'glv' => "Manx",
    'mao' => "Maori",
    'arn' => "Mapudungun; Mapuche",
    'mar' => "Marathi",
    'chm' => "Mari",
    'mah' => "Marshallese",
    'mwr' => "Marwari",
    'mas' => "Masai",
    'myn' => "Mayan languages",
    'men' => "Mende",
    'mic' => "Mi'kmaq; Micmac",
    'min' => "Minangkabau",
    'mwl' => "Mirandese",
    'moh' => "Mohawk",
    'mdf' => "Moksha",
    'mkh' => "Mon-Khmer languages",
    'lol' => "Mongo",
    'mon' => "Mongolian",
    'mos' => "Mossi",
    'mul' => "Multiple languages",
    'mun' => "Munda languages",
    'nqo' => "N'Ko",
    'nah' => "Nahuatl languages",
    'nau' => "Nauru",
    'nav' => "Navajo; Navaho",
    'nde' => "Ndebele, North; North Ndebele",
    'nbl' => "Ndebele, South; South Ndebele",
    'ndo' => "Ndonga",
    'nap' => "Neapolitan",
    'new' => "Nepal Bhasa; Newari",
    'nep' => "Nepali",
    'nia' => "Nias",
    'nic' => "Niger-Kordofanian languages",
    'ssa' => "Nilo-Saharan languages",
    'niu' => "Niuean",
    'zxx' => "No linguistic content; Not applicable",
    'nog' => "Nogai",
    'non' => "Norse, Old",
    'nai' => "North American Indian languages",
    'frr' => "Northern Frisian",
    'sme' => "Northern Sami",
    'nor' => "Norwegian",
    'nno' => "Norwegian Nynorsk; Nynorsk, Norwegian",
    'nub' => "Nubian languages",
    'nym' => "Nyamwezi",
    'nyn' => "Nyankole",
    'nyo' => "Nyoro",
    'nzi' => "Nzima",
    'oci' => "Occitan (post 1500)",
    'arc' => "Official Aramaic (700-300 BCE); Imperial Aramaic (700-300 BCE)",
    'oji' => "Ojibwa",
    'ori' => "Oriya",
    'orm' => "Oromo",
    'osa' => "Osage",
    'oss' => "Ossetian; Ossetic",
    'oto' => "Otomian languages",
    'pal' => "Pahlavi",
    'pau' => "Palauan",
    'pli' => "Pali",
    'pam' => "Pampanga; Kapampangan",
    'pag' => "Pangasinan",
    'pan' => "Panjabi; Punjabi",
    'pap' => "Papiamento",
    'paa' => "Papuan languages",
    'nso' => "Pedi; Sepedi; Northern Sotho",
    'per' => "Persian",
    'peo' => "Persian, Old (ca.600-400 B.C.)",
    'phi' => "Philippine languages",
    'phn' => "Phoenician",
    'pon' => "Pohnpeian",
    'pol' => "Polish",
    'por' => "Portuguese",
    'pra' => "Prakrit languages",
    // Separator normalised to "; " so this entry splits like every other one.
    'pro' => "Provençal, Old (to 1500); Occitan, Old (to 1500)",
    'pus' => "Pushto; Pashto",
    'que' => "Quechua",
    'raj' => "Rajasthani",
    'rap' => "Rapanui",
    'rar' => "Rarotongan; Cook Islands Maori",
    // Range entry: stands for every code from 'qaa' through 'qtz'.
    'qaa-qtz' => "Reserved for local use",
    'roa' => "Romance languages",
    'rum' => "Romanian; Moldavian; Moldovan",
    'roh' => "Romansh",
    'rom' => "Romany",
    'run' => "Rundi",
    'rus' => "Russian",
    'sal' => "Salishan languages",
    'sam' => "Samaritan Aramaic",
    'smi' => "Sami languages",
    'smo' => "Samoan",
    'sad' => "Sandawe",
    'sag' => "Sango",
    'san' => "Sanskrit",
    'sat' => "Santali",
    'srd' => "Sardinian",
    'sas' => "Sasak",
    'sco' => "Scots",
    'sel' => "Selkup",
    'sem' => "Semitic languages",
    'srp' => "Serbian",
    'srr' => "Serer",
    'shn' => "Shan",
    'sna' => "Shona",
    'iii' => "Sichuan Yi; Nuosu",
    'scn' => "Sicilian",
    'sid' => "Sidamo",
    'sgn' => "Sign Languages",
    'bla' => "Siksika",
    'snd' => "Sindhi",
    'sin' => "Sinhala; Sinhalese",
    'sit' => "Sino-Tibetan languages",
    'sio' => "Siouan languages",
    'sms' => "Skolt Sami",
    'den' => "Slave (Athapascan)",
    'sla' => "Slavic languages",
    'slo' => "Slovak",
    'slv' => "Slovenian",
    'sog' => "Sogdian",
    'som' => "Somali",
    'son' => "Songhai languages",
    'snk' => "Soninke",
    'wen' => "Sorbian languages",
    'sot' => "Sotho, Southern",
    'sai' => "South American Indian languages",
    'alt' => "Southern Altai",
    'sma' => "Southern Sami",
    'spa' => "Spanish; Castilian",
    'srn' => "Sranan Tongo",
    'zgh' => "Standard Moroccan Tamazight",
    'suk' => "Sukuma",
    'sux' => "Sumerian",
    'sun' => "Sundanese",
    'sus' => "Susu",
    'swa' => "Swahili",
    'ssw' => "Swati",
    'swe' => "Swedish",
    'gsw' => "Swiss German; Alemannic; Alsatian",
    'syr' => "Syriac",
    'tgl' => "Tagalog",
    'tah' => "Tahitian",
    'tai' => "Tai languages",
    'tgk' => "Tajik",
    'tmh' => "Tamashek",
    'tam' => "Tamil",
    'tat' => "Tatar",
    'tel' => "Telugu",
    'ter' => "Tereno",
    'tet' => "Tetum",
    'tha' => "Thai",
    'tib' => "Tibetan",
    'tig' => "Tigre",
    'tir' => "Tigrinya",
    'tem' => "Timne",
    'tiv' => "Tiv",
    'tli' => "Tlingit",
    'tpi' => "Tok Pisin",
    'tkl' => "Tokelau",
    'tog' => "Tonga (Nyasa)",
    'ton' => "Tonga (Tonga Islands)",
    'tsi' => "Tsimshian",
    'tso' => "Tsonga",
    'tsn' => "Tswana",
    'tum' => "Tumbuka",
    'tup' => "Tupi languages",
    'tur' => "Turkish",
    'ota' => "Turkish, Ottoman (1500-1928)",
    'tuk' => "Turkmen",
    'tvl' => "Tuvalu",
    'tyv' => "Tuvinian",
    'twi' => "Twi",
    'udm' => "Udmurt",
    'uga' => "Ugaritic",
    'uig' => "Uighur; Uyghur",
    'ukr' => "Ukrainian",
    'umb' => "Umbundu",
    'mis' => "Uncoded languages",
    'und' => "Undetermined",
    'hsb' => "Upper Sorbian",
    'urd' => "Urdu",
    'uzb' => "Uzbek",
    'vai' => "Vai",
    'ven' => "Venda",
    'vie' => "Vietnamese",
    'vol' => "Volapük",
    'vot' => "Votic",
    'wak' => "Wakashan languages",
    'wln' => "Walloon",
    'war' => "Waray",
    'was' => "Washo",
    'wel' => "Welsh",
    'fry' => "Western Frisian",
    'wal' => "Wolaitta; Wolaytta",
    'wol' => "Wolof",
    'xho' => "Xhosa",
    'sah' => "Yakut",
    'yao' => "Yao",
    'yap' => "Yapese",
    'yid' => "Yiddish",
    'yor' => "Yoruba",
    'ypk' => "Yupik languages",
    'znd' => "Zande languages",
    'zap' => "Zapotec",
    'zza' => "Zaza; Dimili; Dimli; Kirdki; Kirmanjki; Zazaki",
    'zen' => "Zenaga",
    'zha' => "Zhuang; Chuang",
    'zul' => "Zulu",
    'zun' => "Zuni",
    );