spip_nursit/lib/mpdf/config_lang2fonts.php

514 lines
13 KiB
PHP
Raw Normal View History

2023-06-01 15:30:12 +00:00
<?php
/*
mPDF recognises IETF language tags as:
- a single primary language subtag composed of a two letter language code from ISO 639-1 (2002), or a three letter code from ISO 639-2 (1998), ISO 639-3 (2007) or ISO 639-5 (2008) (usually written in lower case);
- an optional script subtag, composed of a four letter script code from ISO 15924 (usually written in title case);
- an optional region subtag composed of a two letter country code from ISO 3166-1 alpha-2 (usually written in upper case), or a three digit code from UN M.49 for geographical regions;
Subtags are not case sensitive, but the specification recommends using the same case as in the Language Subtag Registry, where region subtags are uppercase, script subtags are titlecase and all other subtags are lowercase.
Region subtags are often deprecated by the registration of specific primary language subtags from ISO 639-3 which are now "preferred values". For example, "ar-DZ" is deprecated with the preferred value "arq" for Algerian Spoken Arabic;
Example: Serbian written in the Cyrillic (sr-Cyrl) or Latin (sr-Latn) script
und (for undetermined or undefined) is used in situations in which a script must be indicated but the language cannot be identified.
e.g. und-Cyrl is an undefined language written in Cyrillic script.
*/
function GetLangOpts($llcc, $adobeCJK, &$fontdata)
{
$tags = preg_split('/-/', $llcc);
$lang = strtolower($tags[0]);
$country = '';
$script = '';
if (isset($tags[1]) && $tags[1]) {
if (strlen($tags[1]) == 4) {
$script = strtolower($tags[1]);
} else {
$country = strtolower($tags[1]);
}
}
if (isset($tags[2]) && $tags[2]) {
$country = strtolower($tags[2]);
}
$unifont = "";
$coreSuitable = false;
switch ($lang) {
/* European */
CASE "en": CASE "eng": // English // LATIN
CASE "eu": CASE "eus": // Basque
CASE "br": CASE "bre": // Breton
CASE "ca": CASE "cat": // Catalan
CASE "co": CASE "cos": // Corsican
CASE "kw": CASE "cor": // Cornish
CASE "cy": CASE "cym": // Welsh
CASE "cs": CASE "ces": // Czech
CASE "da": CASE "dan": // Danish
CASE "nl": CASE "nld": // Dutch
CASE "et": CASE "est": // Estonian
CASE "fo": CASE "fao": // Faroese
CASE "fi": CASE "fin": // Finnish
CASE "fr": CASE "fra": // French
CASE "gl": CASE "glg": // Galician
CASE "de": CASE "deu": // German
CASE "ht": CASE "hat": // Haitian; Haitian Creole
CASE "hu": CASE "hun": // Hungarian
CASE "ga": CASE "gle": // Irish
CASE "is": CASE "isl": // Icelandic
CASE "it": CASE "ita": // Italian
CASE "la": CASE "lat": // Latin
CASE "lb": CASE "ltz": // Luxembourgish
CASE "li": CASE "lim": // Limburgish
CASE "lt": CASE "lit": // Lithuanian
CASE "lv": CASE "lav": // Latvian
CASE "gv": CASE "glv": // Manx
CASE "no": CASE "nor": // Norwegian
CASE "nn": CASE "nno": // Norwegian Nynorsk
CASE "nb": CASE "nob": // Norwegian Bokmål
CASE "pl": CASE "pol": // Polish
CASE "pt": CASE "por": // Portuguese
CASE "ro": CASE "ron": // Romanian
CASE "gd": CASE "gla": // Scottish Gaelic
CASE "es": CASE "spa": // Spanish
CASE "sv": CASE "swe": // Swedish
CASE "sl": CASE "slv": // Slovene
CASE "sk": CASE "slk": // Slovak
$unifont = "dejavusanscondensed";
// Edit this value to define how mPDF behaves when using new mPDF('-x')
// If set to TRUE, mPDF will use Adobe core fonts only when it recognises the languages above
$coreSuitable = true;
break;
CASE "ru": CASE "rus": // Russian // CYRILLIC
CASE "ab": CASE "abk": // Abkhaz
CASE "av": CASE "ava": // Avaric
CASE "ba": CASE "bak": // Bashkir
CASE "be": CASE "bel": // Belarusian
CASE "bg": CASE "bul": // Bulgarian
CASE "ce": CASE "che": // Chechen
CASE "cv": CASE "chv": // Chuvash
CASE "kk": CASE "kaz": // Kazakh
CASE "kv": CASE "kom": // Komi
CASE "ky": CASE "kir": // Kyrgyz
CASE "mk": CASE "mkd": // Macedonian
CASE "cu": CASE "chu": // Old Church Slavonic
CASE "os": CASE "oss": // Ossetian
CASE "sr": CASE "srp": // Serbian
CASE "tg": CASE "tgk": // Tajik
CASE "tt": CASE "tat": // Tatar
CASE "tk": CASE "tuk": // Turkmen
CASE "uk": CASE "ukr": // Ukrainian
$unifont = "dejavusanscondensed"; /* freeserif best coverage for supplements etc. */
break;
CASE "hy": CASE "hye": // ARMENIAN
$unifont = "dejavusans";
break;
CASE "ka": CASE "kat": // GEORGIAN
$unifont = "dejavusans";
break;
CASE "el": CASE "ell": // GREEK
$unifont = "dejavusanscondensed";
break;
CASE "cop": // COPTIC
$unifont = "quivira";
break;
CASE "got": // GOTHIC
$unifont = "freeserif";
break;
/* African */
CASE "nqo": // NKO
$unifont = "dejavusans";
break;
//CASE "bax": // BAMUM
//CASE "ha": CASE "hau": // Hausa
CASE "vai": // VAI
$unifont = "freesans";
break;
CASE "am": CASE "amh": // Amharic ETHIOPIC
CASE "ti": CASE "tir": // Tigrinya ETHIOPIC
$unifont = "abyssinicasil";
break;
/* Middle Eastern */
CASE "ar": CASE "ara": // Arabic NB Arabic text identified by Autofont will be marked as und-Arab
$unifont = "xbriyaz";
break;
CASE "fa": CASE "fas": // Persian (Farsi)
$unifont = "xbriyaz";
break;
CASE "ps": CASE "pus": // Pashto
$unifont = "xbriyaz";
break;
CASE "ku": CASE "kur": // Kurdish
$unifont = "xbriyaz";
break;
CASE "ur": CASE "urd": // Urdu
$unifont = "xbriyaz";
break;
CASE "he": CASE "heb": // HEBREW
CASE "yi": CASE "yid": // Yiddish
$unifont = "taameydavidclm"; // dejavusans,dejavusanscondensed,freeserif are fine if you do not need cantillation marks
break;
CASE "syr": // SYRIAC
$unifont = "estrangeloedessa";
break;
//CASE "arc": // IMPERIAL_ARAMAIC
//CASE ""ae: // AVESTAN
CASE "xcr": // CARIAN
$unifont = "aegean";
break;
CASE "xlc": // LYCIAN
$unifont = "aegean";
break;
CASE "xld": // LYDIAN
$unifont = "aegean";
break;
//CASE "mid": // MANDAIC
//CASE "peo": // OLD_PERSIAN
CASE "phn": // PHOENICIAN
$unifont = "aegean";
break;
//CASE "smp": // SAMARITAN
CASE "uga": // UGARITIC
$unifont = "aegean";
break;
/* Central Asian */
CASE "bo": CASE "bod": // TIBETAN
CASE "dz": CASE "dzo": // Dzongkha
$unifont = "jomolhari";
break;
//CASE "mn": CASE "mon": // MONGOLIAN (Vertical script)
//CASE "ug": CASE "uig": // Uyghur
//CASE "uz": CASE "uzb": // Uzbek
//CASE "az": CASE "azb": // South Azerbaijani
/* South Asian */
CASE "as": CASE "asm": // Assamese
$unifont = "freeserif";
break;
CASE "bn": CASE "ben": // BENGALI; Bangla
$unifont = "freeserif";
break;
CASE "ks": CASE "kas": // Kashmiri
$unifont = "freeserif";
break;
CASE "hi": CASE "hin": // Hindi DEVANAGARI
CASE "bh": CASE "bih": // Bihari (Bhojpuri, Magahi, and Maithili)
CASE "sa": CASE "san": // Sanskrit
$unifont = "freeserif";
break;
CASE "gu": CASE "guj": // Gujarati
$unifont = "freeserif";
break;
CASE "pa": CASE "pan": // Panjabi, Punjabi GURMUKHI
$unifont = "freeserif";
break;
CASE "kn": CASE "kan": // Kannada
$unifont = "lohitkannada";
break;
CASE "mr": CASE "mar": // Marathi
$unifont = "freeserif";
break;
CASE "ml": CASE "mal": // MALAYALAM
$unifont = "freeserif";
break;
CASE "ne": CASE "nep": // Nepali
$unifont = "freeserif";
break;
CASE "or": CASE "ori": // ORIYA
$unifont = "freeserif";
break;
CASE "si": CASE "sin": // SINHALA
$unifont = "kaputaunicode";
break;
CASE "ta": CASE "tam": // TAMIL
$unifont = "freeserif";
break;
CASE "te": CASE "tel": // TELUGU
$unifont = "pothana2000";
break;
// Sindhi (Arabic or Devanagari)
CASE "sd": CASE "snd": // Sindhi
if ($country == "IN") {
$unifont = "freeserif";
} else if ($country == "PK") {
$unifont = "lateef";
} else {
$unifont = "lateef";
}
break;
//CASE "ccp": // CHAKMA
//CASE "lep": // LEPCHA
CASE "lif": // LIMBU
$unifont = "sun-exta";
break;
//CASE "sat": // OL_CHIKI
//CASE "saz": // SAURASHTRA
CASE "syl": // SYLOTI_NAGRI
$unifont = "mph2bdamase";
break;
//CASE "dgo": // TAKRI
CASE "dv": CASE "div": // Divehi; Maldivian THAANA
$unifont = "freeserif";
break;
/* South East Asian */
CASE "km": CASE "khm": // KHMER
$unifont = "khmeros";
break;
CASE "lo": CASE "lao": // LAO
$unifont = "dhyana";
break;
CASE "my": CASE "mya": // MYANMAR Burmese
$unifont = "tharlon"; // zawgyi-one is non-unicode compliant but in wide usage
// ayar is also not strictly compliant
// padaukbook is unicode compliant
break;
CASE "th": CASE "tha": // THAI
$unifont = "garuda";
break;
// VIETNAMESE
CASE "vi": CASE "vie": // Vietnamese
$unifont = "dejavusanscondensed";
break;
//CASE "ms": CASE "msa": // Malay
//CASE "ban": // BALINESE
//CASE "bya": // BATAK
CASE "bug": // BUGINESE
$unifont = "freeserif";
break;
//CASE "cjm": // CHAM
//CASE "jv": // JAVANESE
CASE "su": // SUNDANESE
$unifont = "sundaneseunicode";
break;
CASE "tdd": // TAI_LE
$unifont = "tharlon";
break;
CASE "blt": // TAI_VIET
$unifont = "taiheritagepro";
break;
/* Phillipine */
CASE "bku": // BUHID
$unifont = "quivira";
break;
CASE "hnn": // HANUNOO
$unifont = "quivira";
break;
CASE "tl": // TAGALOG
$unifont = "quivira";
break;
CASE "tbw": // TAGBANWA
$unifont = "quivira";
break;
/* East Asian */
CASE "zh": CASE "zho": // Chinese
if ($country == "HK" || $country == "TW") {
if ($adobeCJK) {
$unifont = "big5";
} else {
$unifont = "sun-exta";
}
} else if ($country == "CN") {
if ($adobeCJK) {
$unifont = "gb";
} else {
$unifont = "sun-exta";
}
} else {
if ($adobeCJK) {
$unifont = "gb";
} else {
$unifont = "sun-exta";
}
}
break;
CASE "ko": CASE "kor": // HANGUL Korean
if ($adobeCJK) {
$unifont = "uhc";
} else {
$unifont = "unbatang";
}
break;
CASE "ja": CASE "jpn": // Japanese HIRAGANA KATAKANA
if ($adobeCJK) {
$unifont = "sjis";
} else {
$unifont = "sun-exta";
}
break;
CASE "ii": CASE "iii": // Nuosu; Yi
if ($adobeCJK) {
$unifont = "gb";
} else {
$unifont = "sun-exta";
}
CASE "lis": // LISU
$unifont = "quivira";
break;
/* American */
CASE "chr": // CHEROKEE
CASE "oj": CASE "oji": // Ojibwe; Chippewa
CASE "cr": CASE "cre": // Cree CANADIAN_ABORIGINAL
CASE "iu": CASE "iku": // Inuktitut
$unifont = "aboriginalsans";
break;
/* Undetermined language - script used */
CASE "und":
switch ($script) {
/* European */
CASE "latn": // LATIN
$unifont = "dejavusanscondensed";
break;
CASE "cyrl": // CYRILLIC
$unifont = "dejavusanscondensed"; /* freeserif best coverage for supplements etc. */
break;
CASE "cprt": // CYPRIOT
$unifont = "aegean";
break;
CASE "glag": // GLAGOLITIC
$unifont = "mph2bdamase";
break;
CASE "linb": // LINEAR_B
$unifont = "aegean";
break;
CASE "ogam": // OGHAM
$unifont = "dejavusans";
break;
CASE "ital": // OLD_ITALIC
$unifont = "aegean";
break;
CASE "runr": // RUNIC
$unifont = "sun-exta";
break;
CASE "shaw": // SHAVIAN
$unifont = "mph2bdamase";
break;
/* African */
CASE "egyp": // EGYPTIAN_HIEROGLYPHS
$unifont = "aegyptus";
break;
CASE "ethi": // ETHIOPIC
$unifont = "abyssinicasil";
break;
//CASE "merc": // MEROITIC_CURSIVE
//CASE "mero": // MEROITIC_HIEROGLYPHS
CASE "osma": // OSMANYA
$unifont = "mph2bdamase";
break;
CASE "tfng": // TIFINAGH
$unifont = "dejavusans";
break;
/* Middle Eastern */
CASE "arab": // ARABIC
$unifont = "xbriyaz";
break;
CASE "xsux": // CUNEIFORM
$unifont = "akkadian";
break;
//CASE "sarb": // OLD_SOUTH_ARABIAN
//CASE "prti": // INSCRIPTIONAL_PARTHIAN
//CASE "phli": // INSCRIPTIONAL_PAHLAVI
/* Central Asian */
//CASE "orkh": // OLD_TURKIC
//CASE "phag": // PHAGS_PA (Vertical script)
/* South Asian */
//CASE "brah": // BRAHMI
//CASE "kthi": // KAITHI
CASE "khar": // KHAROSHTHI
$unifont = "mph2bdamase";
break;
CASE "mtei": // MEETEI_MAYEK
$unifont = "eeyekunicode";
break;
//CASE "shrd": // SHARADA
//CASE "sora": // SORA_SOMPENG
/* South East Asian */
CASE "kali": // KAYAH_LI
$unifont = "freemono";
break;
//CASE "rjng": // REJANG
CASE "lana": // TAI_THAM
$unifont = "lannaalif";
break;
CASE "talu": // NEW_TAI_LUE
$unifont = "daibannasilbook";
break;
/* East Asian */
CASE "hans": // HAN (SIMPLIFIED)
if ($adobeCJK) {
$unifont = "gb";
} else {
$unifont = "sun-exta";
}
break;
CASE "bopo": // BOPOMOFO
$unifont = "sun-exta";
break;
//CASE "plrd": // MIAO
CASE "yiii": // YI
$unifont = "sun-exta";
break;
/* American */
CASE "dsrt": // DESERET
$unifont = "mph2bdamase";
break;
/* Other */
CASE "brai": // BRAILLE
$unifont = "dejavusans";
break;
} // endswitch
break;
} // endswitch
return array($coreSuitable, $unifont);
}