From cb944163a86192c15635df2e6004f090a019cb10 Mon Sep 17 00:00:00 2001 From: wr61 Date: Thu, 3 Mar 2005 13:03:11 +0000 Subject: generate languages from xml file git-svn-id: https://vdr-muggle.svn.sourceforge.net/svnroot/vdr-muggle/branches/0.1.3-wr@531 e10066b5-e1e2-0310-b819-94efdf66514b --- scripts/COPYRIGHT | 15 - scripts/gentables | 7 +- scripts/iso639tab.py | 29 +- scripts/iso_639.xml | 2072 +++++++++++++++++++++++++++++++++++++++++++++++++ scripts/languages.txt | 467 ----------- 5 files changed, 2102 insertions(+), 488 deletions(-) delete mode 100644 scripts/COPYRIGHT create mode 100644 scripts/iso_639.xml delete mode 100755 scripts/languages.txt (limited to 'scripts') diff --git a/scripts/COPYRIGHT b/scripts/COPYRIGHT deleted file mode 100644 index e41ca51..0000000 --- a/scripts/COPYRIGHT +++ /dev/null @@ -1,15 +0,0 @@ -# the content of languages.txt is generated by iso639tab.py from -# the file iso_639.xml. iso_639.xml contains this copyright note: -# -# -# -# -# -# -# -# -# -# -# -# -# diff --git a/scripts/gentables b/scripts/gentables index cdc97db..f7fcc89 100755 --- a/scripts/gentables +++ b/scripts/gentables @@ -16,9 +16,12 @@ echo '}; echo "lang_t languages[] = {" -cat scripts/languages.txt | while read iso name +scripts/iso639tab.py scripts/iso_639.xml | + grep -v '^#' | + grep -v '^$' | + while read iso1 iso2 iso3 name do - echo ' { "'$iso'", "'$name'" },' + echo ' { "'$iso2'", "'$name'" },' done echo '}; ' diff --git a/scripts/iso639tab.py b/scripts/iso639tab.py index d9d0b86..b2739c9 100755 --- a/scripts/iso639tab.py +++ b/scripts/iso639tab.py @@ -6,9 +6,6 @@ # Released under the GPL. # $Id: iso639tab.py,v 1.1 2005/03/02 07:24:51 mckinstry Exp $ -# modified by Wolfgang Rohdewald such that it only converts the -# iso-639-2 bibliography code and the name without comments - from xml.sax import saxutils, make_parser, saxlib, saxexts, ContentHandler from xml.sax.handler import feature_namespaces import sys, os, getopt, urllib2 @@ -37,7 +34,7 @@ class printLines(saxutils.DefaultHandler): short_code=short_code.encode('UTF-8') if type(name) == unicode: name = name.encode('UTF-8') - self.ofile.write (b_code + '\t' + name + '\n') + self.ofile.write (t_code + '\t' + b_code + '\t' + short_code + '\t' + name + '\n') ## @@ -46,6 +43,30 @@ class printLines(saxutils.DefaultHandler): ofile = sys.stdout +ofile.write(""" +## iso-639.tab +## +## Copyright (C) 2005 Alastair McKinstry +## Released under the GNU License; see file COPYING for details +## +## PLEASE NOTE: THIS FILE IS DEPRECATED AND SCHEDULED TO BE REMOVED. +## IT IS FOR BACKWARD-COMPATIBILITY ONLY: PLEASE USE THE ISO-639.XML +## FILE INSTEAD. +## +## This file gives a list of all languages in the ISO-639 +## standard, and is used to provide translations (via gettext) +## +## Status: ISO 639-2:1998 + additions and changes until 2003-03-05 +## Source: http://lcweb.loc.gov/standards/iso639-2/englangn.html +## +## Columns: +## iso-639-2 terminology code +## iso-639-2 bibliography code +## iso-639-1 code (XX if none exists) +## Name (English) +## +## +""") p = make_parser() p.setErrorHandler(saxutils.ErrorPrinter()) try: diff --git a/scripts/iso_639.xml b/scripts/iso_639.xml new file mode 100644 index 0000000..ed6fc73 --- /dev/null +++ b/scripts/iso_639.xml @@ -0,0 +1,2072 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/scripts/languages.txt b/scripts/languages.txt deleted file mode 100755 index 6378dcc..0000000 --- a/scripts/languages.txt +++ /dev/null @@ -1,467 +0,0 @@ -aar Afar -abk Abkhazian -ace Achinese -ach Acoli -ada Adangme -ady Adyghe; Adygei -afa Afro-Asiatic (Other) -afh Afrihili -afr Afrikaans -aka Akan -akk Akkadian -alb Albanian -amh Amharic -ang English, Old (ca.450-1100) -apa Apache languages -ara Arabic -arc Aramaic -arg Aragonese -arm Armenian -arn Araucanian -arp Arapaho -art Artificial (Other) -arw Arawak -asm Assamese -ast Asturian; Bable -ath Athapascan language -aus Australian languages -ava Avaric -ave Avestan -awa Awadhi -aym Aymara -aze Azerbaijani -bad Banda -bai Bamileke languages -bak Bashkir -bal Baluchi -bam Bambara -ban Balinese -baq Basque -bas Basa -bat Baltic (Other) -bej Beja -bel Belarusian -bem Bemba -ben Bengali -ber Berber (Other) -bho Bhojpuri -bih Bihari -bik Bikol -bin Bini -bis Bislama -bla Siksika -bnt Bantu (Other) -bos Bosnian -bra Braj -bre Breton -btk Batak (Indonesia) -bua Buriat -bug Buginese -bul Bulgarian -bur Burmese -byn Blin; Bilin -cad Caddo -cai Central American Indian (Other) -car Carib -cat Catalan -cau Caucasian (Other) -ceb Cebuano -cel Celtic (Other) -cha Chamorro -chb Chibcha -che Chechen -chg Chagatai -chi Chinese -chk Chukese -chm Mari -chn Chinook jargon -cho Choctaw -chp Chipewyan -chr Cherokee -chu Church Slavic -chv Chuvash -chy Cheyenne -cmc Chamic languages -cop Coptic -cor Cornish -cos Corsican -cpe English-based (Other) -cpf French-based (Other) -cpp Portuguese-based (Other) -cre Cree -crh Crimean Turkish; Crimean Tatar -crp Creoles and pidgins (Other) -csb Kashubian -cus Cushitic (Other) -cze Czech -dak Dakota -dan Danish -dar Dargwa -del Delaware -den Slave (Athapascan) -dgr Dogrib -din Dinka -div Divehi -doi Dogri -dra Dravidian (Other) -dsb Lower Sorbian -dua Duala -dum Dutch, Middle (ca. 1050-1350) -dut Dutch -dyu Dyula -dzo Dzongkha -efi Efik -egy Egyptian (Ancient) -eka Ekajuk -elx Elamite -eng English -enm English, Middle (1100-1500) -epo Esperanto -est Estonian -ewe Ewe -ewo Ewondo -fan Fang -fao Faroese -fat Fanti -fij Fijian -fil Filipino; Pilipino -fin Finnish -fiu Finno-Ugrian (Other) -fon Fon -fre French -frm French, Middle (ca.1400-1600) -fro French, Old (842-ca.1400) -fry Frisian -ful Fulah -fur Friulian -gaa Ga -gay Gayo -gba Gbaya -gem Germanic (Other) -geo Georgian -ger German -gez Geez -gil Gilbertese -gla Gaelic; Scottish -gle Irish -glg Gallegan -glv Manx -gmh German, Middle High (ca.1050-1500) -goh German, Old High (ca.750-1050) -gon Gondi -gor Gorontalo -got Gothic -grb Grebo -grc Greek, Ancient (to 1453) -gre Greek, Modern (1453-) -grn Guarani -guj Gujarati -gwi Gwichin -hai Haida -hat Haitian; Haitian Creole -hau Hausa -haw Hawaiian -heb Hebrew -her Herero -hil Hiligaynon -him Himachali -hin Hindi -hit Hittite -hmn Hmong -hmo Hiri -hsb Upper Sorbian -hun Hungarian -hup Hupa -iba Iban -ibo Igbo -ice Icelandic -ido Ido -iii Sichuan Yi -ijo Ijo -iku Inuktitut -ile Interlingue -ilo Iloko -ina Interlingua -inc Indic (Other) -ind Indonesian -ine Indo-European (Other) -inh Ingush -ipk Inupiaq -ira Iranian (Other) -iro Iroquoian languages -ita Italian -jav Javanese -jbo Lojban -jpn Japanese -jpr Judeo-Persian -jrb Judeo-Arabic -kaa Kara-Kalpak -kab Kabyle -kac Kachin -kal Greenlandic (Kalaallisut) -kam Kamba -kan Kannada -kar Karen -kas Kashmiri -kau Kanuri -kaw Kawi -kaz Kazakh -kbd Kabardian -kha Khazi -khi Khoisan (Other) -khm Khmer -kho Khotanese -kik Kikuyu -kin Kinyarwanda -kir Kirghiz -kmb Kimbundu -kok Konkani -kom Komi -kon Kongo -kor Korean -kos Kosraean -kpe Kpelle -krc Karachay-Balkar -kro Kru -kru Kurukh -kua Kuanyama -kum Kumyk -kur Kurdish -kut Kutenai -lad Ladino -lah Lahnda -lam Lamba -lao Lao -lat Latin -lav Latvian -lez Lezghian -lim Limburgian -lin Lingala -lit Lithuanian -lol Mongo -loz Lozi -ltz Luxembourgish -lua Luba-Lulua -lub Luba-Katanga -lug Ganda -lui Luiseno -lun Lunda -luo Luo (Kenya and Tanzania) -lus Lushai -mac Macedonian -mad Madurese -mag Magahi -mah Marshallese -mai Maithili -mak Makasar -mal Malayalam -man Mandingo -mao Maori -map Austronesian (Other) -mar Marathi -mas Masai -may Malay -mdf Moksha -mdr Mandar -men Mende -mga Irish, Middle (900-1200) -mic Mi'kmaq; Micmac -min Minangkabau -mis Miscellaneous languages -mkh Mon-Khmer (Other) -mlg Malagasy -mlt Maltese -mnc Manchu -mno Manobo languages -moh Mohawk -mol Moldavian -mon Mongolian -mos Mossi -mul Multiple languages -mun Munda languages -mus Creek -mwl Mirandese -mwr Marwari -myn Mayan languages -myv Erzya -nah Nahuatl -nai North American Indian (Other) -nap Neapolitan -nau Nauru -nav Navaho -nbl Ndebele, South -nde Ndebele, North -ndo Ndonga -nds German, Low -nep Nepali -new Newari -nia Nias -nic Niger-Kordofanian (Other) -niu Niuean -nno Norwegian Nynorsk -nob Bokmål, Norwegian -nog Nogai -non Norse, Old -nor Norwegian -nso Northern Sotho; Pedi; Sepedi -nub Nubian languages -nym Nyamwezi -nwc Classical Newari; Old Newari -nya Chewa; Chichewa; Nyanja -nyn Nyankole -nyo Nyoro -nzi Nzima -oci Occitan (post 1500) -oji Ojibwa -ori Oriya -orm Oromo -osa Osage -oss Ossetian -ota Turkish, Ottoman (1500-1928) -oto Otomian languages -paa Papuan (Other) -pag Pangasinan -pal Pahlavi -pam Pampanga -pan Punjabi -pap Papiamento -pau Palauan -peo Persian, Old (ca.600-400 B.C.) -per Persian -phi Philippine (Other) -phn Phoenician -pli Pali -pol Polish -por Portuguese -pon Pohnpeian -pra Prakrit languages -pro Provençal, Old (to 1500) -pus Pushto -que Quechua -raj Rajasthani -rap Rapanui -rar Rarotongan -roa Romance (Other) -roh Raeto-Romance -rom Romany -rum Romanian -run Rundi -rus Russian -sad Sandawe -sag Sango -sah Yakut -sai South American Indian (Other) -sal Salishan languages -sam Samaritan Aramaic -san Sanskrit -sas Sasak -sat Santali -scc Serbian -scn Sicilian -sco Scots -scr Croatian -sel Selkup -sem Semitic (Other) -sga Irish, Old (to 900) -sgn Sign languages -shn Shan -sid Sidamo -sin Sinhala; Sinhalese -sio Siouan languages -sit Sino-Tibetan (Other) -sla Slavic (Other) -slo Slovak -slv Slovenian -sma Southern Sami -sme Northern Sami -smi Sami languages (Other) -smj Lule Sami -smn Inari Sami -smo Samoan -sms Skolt Sami -sna Shona -snd Sindhi -snk Soninke -sog Sogdian -som Somali -son Songhai -sot Sotho, Southern -spa Spanish -srd Sardinian -srr Serer -ssa Nilo-Saharan (Other) -ssw Swati -suk Sukuma -sun Sundanese -sus Susu -sux Sumerian -swa Swahili -swe Swedish -syr Syriac -tah Tahitian -tai Tai (Other) -tam Tamil -tso Tsonga -tat Tatar -tel Telugu -tem Timne -ter Tereno -tet Tetum -tgk Tajik -tgl Tagalog -tha Thai -tib Tibetan -tig Tigre -tir Tigrinya -tiv Tiv -tlh Klingon; tlhIngan-Hol -tkl Tokelau -tli Tlinglit -tmh Tamashek -tog Tonga (Nyasa) -ton Tonga (Tonga Islands) -tpi Tok Pisin -tsi Tsimshian -tsn Tswana -tuk Turkmen -tum Tumbuka -tup Tupi languages -tur Turkish -tut Altaic (Other) -tvl Tuvalu -twi Twi -tyv Tuvinian -udm Udmurt -uga Ugaritic -uig Uighur -ukr Ukrainian -umb Umbundu -und Undetermined -urd Urdu -uzb Uzbek -vai Vai -ven Venda -vie Vietnamese -vol Volapuk -vot Votic -wak Wakashan languages -wal Walamo -war Waray -was Washo -wel Welsh -wen Sorbian languages -wln Walloon -wol Wolof -xal Kalmyk -xho Xhosa -yao Yao -yap Yapese -yid Yiddish -yor Yoruba -ypk Yupik languages -zap Zapotec -zen Zenaga -zha Chuang; Zhuang -znd Zande -zul Zulu -zun Zuni -- cgit v1.2.3