- Added comprehensive AI Assistant system (aiassist/ directory): * Vector search and embedding capabilities * Typebot proxy integration * Elastic search functionality * Message classification and chat history * MCP proxy for external integrations - Implemented Court Status API (GetCourtStatus.php): * Real-time court document status checking * Integration with external court systems * Comprehensive error handling and logging - Enhanced S3 integration: * Improved file backup system with metadata * Batch processing capabilities * Enhanced error logging and recovery * Copy operations with URL fixing - Added Telegram contact creation API - Improved error logging across all modules - Enhanced callback system for AI responses - Extensive backup file storage with timestamps - Updated documentation and README files - File storage improvements: * Thousands of backup files with proper metadata * Fix operations for broken file references * Project-specific backup and recovery systems * Comprehensive file integrity checking Total: 26,461+ files added/modified including AWS SDK, vendor dependencies, and extensive backup system.
514 lines
13 KiB
PHP
514 lines
13 KiB
PHP
<?php
|
|
|
|
/*
|
|
mPDF recognises IETF language tags as:
|
|
- a single primary language subtag composed of a two letter language code from ISO 639-1 (2002), or a three letter code from ISO 639-2 (1998), ISO 639-3 (2007) or ISO 639-5 (2008) (usually written in lower case);
|
|
- an optional script subtag, composed of a four letter script code from ISO 15924 (usually written in title case);
|
|
- an optional region subtag composed of a two letter country code from ISO 3166-1 alpha-2 (usually written in upper case), or a three digit code from UN M.49 for geographical regions;
|
|
Subtags are not case sensitive, but the specification recommends using the same case as in the Language Subtag Registry, where region subtags are uppercase, script subtags are titlecase and all other subtags are lowercase.
|
|
|
|
Region subtags are often deprecated by the registration of specific primary language subtags from ISO 639-3 which are now "preferred values". For example, "ar-DZ" is deprecated with the preferred value "arq" for Algerian Spoken Arabic;
|
|
|
|
Example: Serbian written in the Cyrillic (sr-Cyrl) or Latin (sr-Latn) script
|
|
|
|
und (for undetermined or undefined) is used in situations in which a script must be indicated but the language cannot be identified.
|
|
e.g. und-Cyrl is an undefined language written in Cyrillic script.
|
|
*/
|
|
|
|
function GetLangOpts($llcc, $adobeCJK, &$fontdata)
|
|
{
|
|
$tags = preg_split('/-/', $llcc);
|
|
$lang = strtolower($tags[0]);
|
|
$country = '';
|
|
$script = '';
|
|
if (isset($tags[1]) && $tags[1]) {
|
|
if (strlen($tags[1]) == 4) {
|
|
$script = strtolower($tags[1]);
|
|
} else {
|
|
$country = strtolower($tags[1]);
|
|
}
|
|
}
|
|
if (isset($tags[2]) && $tags[2]) {
|
|
$country = strtolower($tags[2]);
|
|
}
|
|
|
|
$unifont = "";
|
|
$coreSuitable = false;
|
|
|
|
switch ($lang) {
|
|
|
|
/* European */
|
|
CASE "en": CASE "eng": // English // LATIN
|
|
CASE "eu": CASE "eus": // Basque
|
|
CASE "br": CASE "bre": // Breton
|
|
CASE "ca": CASE "cat": // Catalan
|
|
CASE "co": CASE "cos": // Corsican
|
|
CASE "kw": CASE "cor": // Cornish
|
|
CASE "cy": CASE "cym": // Welsh
|
|
CASE "cs": CASE "ces": // Czech
|
|
CASE "da": CASE "dan": // Danish
|
|
CASE "nl": CASE "nld": // Dutch
|
|
CASE "et": CASE "est": // Estonian
|
|
CASE "fo": CASE "fao": // Faroese
|
|
CASE "fi": CASE "fin": // Finnish
|
|
CASE "fr": CASE "fra": // French
|
|
CASE "gl": CASE "glg": // Galician
|
|
CASE "de": CASE "deu": // German
|
|
CASE "ht": CASE "hat": // Haitian; Haitian Creole
|
|
CASE "hu": CASE "hun": // Hungarian
|
|
CASE "ga": CASE "gle": // Irish
|
|
CASE "is": CASE "isl": // Icelandic
|
|
CASE "it": CASE "ita": // Italian
|
|
CASE "la": CASE "lat": // Latin
|
|
CASE "lb": CASE "ltz": // Luxembourgish
|
|
CASE "li": CASE "lim": // Limburgish
|
|
CASE "lt": CASE "lit": // Lithuanian
|
|
CASE "lv": CASE "lav": // Latvian
|
|
CASE "gv": CASE "glv": // Manx
|
|
CASE "no": CASE "nor": // Norwegian
|
|
CASE "nn": CASE "nno": // Norwegian Nynorsk
|
|
CASE "nb": CASE "nob": // Norwegian Bokmål
|
|
CASE "pl": CASE "pol": // Polish
|
|
CASE "pt": CASE "por": // Portuguese
|
|
CASE "ro": CASE "ron": // Romanian
|
|
CASE "gd": CASE "gla": // Scottish Gaelic
|
|
CASE "es": CASE "spa": // Spanish
|
|
CASE "sv": CASE "swe": // Swedish
|
|
CASE "sl": CASE "slv": // Slovene
|
|
CASE "sk": CASE "slk": // Slovak
|
|
$unifont = "dejavusanscondensed";
|
|
// Edit this value to define how mPDF behaves when using new mPDF('-x')
|
|
// If set to TRUE, mPDF will use Adobe core fonts only when it recognises the languages above
|
|
$coreSuitable = true;
|
|
break;
|
|
|
|
CASE "ru": CASE "rus": // Russian // CYRILLIC
|
|
CASE "ab": CASE "abk": // Abkhaz
|
|
CASE "av": CASE "ava": // Avaric
|
|
CASE "ba": CASE "bak": // Bashkir
|
|
CASE "be": CASE "bel": // Belarusian
|
|
CASE "bg": CASE "bul": // Bulgarian
|
|
CASE "ce": CASE "che": // Chechen
|
|
CASE "cv": CASE "chv": // Chuvash
|
|
CASE "kk": CASE "kaz": // Kazakh
|
|
CASE "kv": CASE "kom": // Komi
|
|
CASE "ky": CASE "kir": // Kyrgyz
|
|
CASE "mk": CASE "mkd": // Macedonian
|
|
CASE "cu": CASE "chu": // Old Church Slavonic
|
|
CASE "os": CASE "oss": // Ossetian
|
|
CASE "sr": CASE "srp": // Serbian
|
|
CASE "tg": CASE "tgk": // Tajik
|
|
CASE "tt": CASE "tat": // Tatar
|
|
CASE "tk": CASE "tuk": // Turkmen
|
|
CASE "uk": CASE "ukr": // Ukrainian
|
|
$unifont = "dejavusanscondensed"; /* freeserif best coverage for supplements etc. */
|
|
break;
|
|
|
|
CASE "hy": CASE "hye": // ARMENIAN
|
|
$unifont = "dejavusans";
|
|
break;
|
|
CASE "ka": CASE "kat": // GEORGIAN
|
|
$unifont = "dejavusans";
|
|
break;
|
|
|
|
CASE "el": CASE "ell": // GREEK
|
|
$unifont = "dejavusanscondensed";
|
|
break;
|
|
CASE "cop": // COPTIC
|
|
$unifont = "quivira";
|
|
break;
|
|
|
|
CASE "got": // GOTHIC
|
|
$unifont = "freeserif";
|
|
break;
|
|
|
|
/* African */
|
|
CASE "nqo": // NKO
|
|
$unifont = "dejavusans";
|
|
break;
|
|
//CASE "bax": // BAMUM
|
|
//CASE "ha": CASE "hau": // Hausa
|
|
CASE "vai": // VAI
|
|
$unifont = "freesans";
|
|
break;
|
|
CASE "am": CASE "amh": // Amharic ETHIOPIC
|
|
CASE "ti": CASE "tir": // Tigrinya ETHIOPIC
|
|
$unifont = "abyssinicasil";
|
|
break;
|
|
|
|
|
|
|
|
/* Middle Eastern */
|
|
CASE "ar": CASE "ara": // Arabic NB Arabic text identified by Autofont will be marked as und-Arab
|
|
$unifont = "xbriyaz";
|
|
break;
|
|
CASE "fa": CASE "fas": // Persian (Farsi)
|
|
$unifont = "xbriyaz";
|
|
break;
|
|
CASE "ps": CASE "pus": // Pashto
|
|
$unifont = "xbriyaz";
|
|
break;
|
|
CASE "ku": CASE "kur": // Kurdish
|
|
$unifont = "xbriyaz";
|
|
break;
|
|
CASE "ur": CASE "urd": // Urdu
|
|
$unifont = "xbriyaz";
|
|
break;
|
|
CASE "he": CASE "heb": // HEBREW
|
|
CASE "yi": CASE "yid": // Yiddish
|
|
$unifont = "taameydavidclm"; // dejavusans,dejavusanscondensed,freeserif are fine if you do not need cantillation marks
|
|
break;
|
|
|
|
|
|
CASE "syr": // SYRIAC
|
|
$unifont = "estrangeloedessa";
|
|
break;
|
|
|
|
|
|
//CASE "arc": // IMPERIAL_ARAMAIC
|
|
//CASE ""ae: // AVESTAN
|
|
CASE "xcr": // CARIAN
|
|
$unifont = "aegean";
|
|
break;
|
|
CASE "xlc": // LYCIAN
|
|
$unifont = "aegean";
|
|
break;
|
|
CASE "xld": // LYDIAN
|
|
$unifont = "aegean";
|
|
break;
|
|
//CASE "mid": // MANDAIC
|
|
//CASE "peo": // OLD_PERSIAN
|
|
CASE "phn": // PHOENICIAN
|
|
$unifont = "aegean";
|
|
break;
|
|
//CASE "smp": // SAMARITAN
|
|
CASE "uga": // UGARITIC
|
|
$unifont = "aegean";
|
|
break;
|
|
|
|
|
|
/* Central Asian */
|
|
CASE "bo": CASE "bod": // TIBETAN
|
|
CASE "dz": CASE "dzo": // Dzongkha
|
|
$unifont = "jomolhari";
|
|
break;
|
|
//CASE "mn": CASE "mon": // MONGOLIAN (Vertical script)
|
|
//CASE "ug": CASE "uig": // Uyghur
|
|
//CASE "uz": CASE "uzb": // Uzbek
|
|
//CASE "az": CASE "azb": // South Azerbaijani
|
|
|
|
|
|
/* South Asian */
|
|
CASE "as": CASE "asm": // Assamese
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "bn": CASE "ben": // BENGALI; Bangla
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "ks": CASE "kas": // Kashmiri
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "hi": CASE "hin": // Hindi DEVANAGARI
|
|
CASE "bh": CASE "bih": // Bihari (Bhojpuri, Magahi, and Maithili)
|
|
CASE "sa": CASE "san": // Sanskrit
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "gu": CASE "guj": // Gujarati
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "pa": CASE "pan": // Panjabi, Punjabi GURMUKHI
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "kn": CASE "kan": // Kannada
|
|
$unifont = "lohitkannada";
|
|
break;
|
|
CASE "mr": CASE "mar": // Marathi
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "ml": CASE "mal": // MALAYALAM
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "ne": CASE "nep": // Nepali
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "or": CASE "ori": // ORIYA
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "si": CASE "sin": // SINHALA
|
|
$unifont = "kaputaunicode";
|
|
break;
|
|
CASE "ta": CASE "tam": // TAMIL
|
|
$unifont = "freeserif";
|
|
break;
|
|
CASE "te": CASE "tel": // TELUGU
|
|
$unifont = "pothana2000";
|
|
break;
|
|
|
|
|
|
// Sindhi (Arabic or Devanagari)
|
|
CASE "sd": CASE "snd": // Sindhi
|
|
if ($country == "IN") {
|
|
$unifont = "freeserif";
|
|
} else if ($country == "PK") {
|
|
$unifont = "lateef";
|
|
} else {
|
|
$unifont = "lateef";
|
|
}
|
|
break;
|
|
|
|
|
|
//CASE "ccp": // CHAKMA
|
|
//CASE "lep": // LEPCHA
|
|
CASE "lif": // LIMBU
|
|
$unifont = "sun-exta";
|
|
break;
|
|
//CASE "sat": // OL_CHIKI
|
|
//CASE "saz": // SAURASHTRA
|
|
CASE "syl": // SYLOTI_NAGRI
|
|
$unifont = "mph2bdamase";
|
|
break;
|
|
//CASE "dgo": // TAKRI
|
|
CASE "dv": CASE "div": // Divehi; Maldivian THAANA
|
|
$unifont = "freeserif";
|
|
break;
|
|
|
|
|
|
|
|
/* South East Asian */
|
|
CASE "km": CASE "khm": // KHMER
|
|
$unifont = "khmeros";
|
|
break;
|
|
CASE "lo": CASE "lao": // LAO
|
|
$unifont = "dhyana";
|
|
break;
|
|
CASE "my": CASE "mya": // MYANMAR Burmese
|
|
$unifont = "tharlon"; // zawgyi-one is non-unicode compliant but in wide usage
|
|
// ayar is also not strictly compliant
|
|
// padaukbook is unicode compliant
|
|
break;
|
|
CASE "th": CASE "tha": // THAI
|
|
$unifont = "garuda";
|
|
break;
|
|
|
|
|
|
|
|
// VIETNAMESE
|
|
CASE "vi": CASE "vie": // Vietnamese
|
|
$unifont = "dejavusanscondensed";
|
|
break;
|
|
|
|
|
|
//CASE "ms": CASE "msa": // Malay
|
|
//CASE "ban": // BALINESE
|
|
//CASE "bya": // BATAK
|
|
CASE "bug": // BUGINESE
|
|
$unifont = "freeserif";
|
|
break;
|
|
//CASE "cjm": // CHAM
|
|
//CASE "jv": // JAVANESE
|
|
CASE "su": // SUNDANESE
|
|
$unifont = "sundaneseunicode";
|
|
break;
|
|
CASE "tdd": // TAI_LE
|
|
$unifont = "tharlon";
|
|
break;
|
|
CASE "blt": // TAI_VIET
|
|
$unifont = "taiheritagepro";
|
|
break;
|
|
|
|
|
|
/* Phillipine */
|
|
CASE "bku": // BUHID
|
|
$unifont = "quivira";
|
|
break;
|
|
CASE "hnn": // HANUNOO
|
|
$unifont = "quivira";
|
|
break;
|
|
CASE "tl": // TAGALOG
|
|
$unifont = "quivira";
|
|
break;
|
|
CASE "tbw": // TAGBANWA
|
|
$unifont = "quivira";
|
|
break;
|
|
|
|
|
|
/* East Asian */
|
|
CASE "zh": CASE "zho": // Chinese
|
|
if ($country == "HK" || $country == "TW") {
|
|
if ($adobeCJK) {
|
|
$unifont = "big5";
|
|
} else {
|
|
$unifont = "sun-exta";
|
|
}
|
|
} else if ($country == "CN") {
|
|
if ($adobeCJK) {
|
|
$unifont = "gb";
|
|
} else {
|
|
$unifont = "sun-exta";
|
|
}
|
|
} else {
|
|
if ($adobeCJK) {
|
|
$unifont = "gb";
|
|
} else {
|
|
$unifont = "sun-exta";
|
|
}
|
|
}
|
|
break;
|
|
CASE "ko": CASE "kor": // HANGUL Korean
|
|
if ($adobeCJK) {
|
|
$unifont = "uhc";
|
|
} else {
|
|
$unifont = "unbatang";
|
|
}
|
|
break;
|
|
CASE "ja": CASE "jpn": // Japanese HIRAGANA KATAKANA
|
|
if ($adobeCJK) {
|
|
$unifont = "sjis";
|
|
} else {
|
|
$unifont = "sun-exta";
|
|
}
|
|
break;
|
|
CASE "ii": CASE "iii": // Nuosu; Yi
|
|
if ($adobeCJK) {
|
|
$unifont = "gb";
|
|
} else {
|
|
$unifont = "sun-exta";
|
|
}
|
|
CASE "lis": // LISU
|
|
$unifont = "quivira";
|
|
break;
|
|
|
|
|
|
|
|
/* American */
|
|
CASE "chr": // CHEROKEE
|
|
CASE "oj": CASE "oji": // Ojibwe; Chippewa
|
|
CASE "cr": CASE "cre": // Cree CANADIAN_ABORIGINAL
|
|
CASE "iu": CASE "iku": // Inuktitut
|
|
$unifont = "aboriginalsans";
|
|
break;
|
|
|
|
|
|
/* Undetermined language - script used */
|
|
CASE "und":
|
|
|
|
switch ($script) {
|
|
|
|
/* European */
|
|
CASE "latn": // LATIN
|
|
$unifont = "dejavusanscondensed";
|
|
break;
|
|
CASE "cyrl": // CYRILLIC
|
|
$unifont = "dejavusanscondensed"; /* freeserif best coverage for supplements etc. */
|
|
break;
|
|
CASE "cprt": // CYPRIOT
|
|
$unifont = "aegean";
|
|
break;
|
|
CASE "glag": // GLAGOLITIC
|
|
$unifont = "mph2bdamase";
|
|
break;
|
|
CASE "linb": // LINEAR_B
|
|
$unifont = "aegean";
|
|
break;
|
|
CASE "ogam": // OGHAM
|
|
$unifont = "dejavusans";
|
|
break;
|
|
CASE "ital": // OLD_ITALIC
|
|
$unifont = "aegean";
|
|
break;
|
|
CASE "runr": // RUNIC
|
|
$unifont = "sun-exta";
|
|
break;
|
|
CASE "shaw": // SHAVIAN
|
|
$unifont = "mph2bdamase";
|
|
break;
|
|
|
|
/* African */
|
|
CASE "egyp": // EGYPTIAN_HIEROGLYPHS
|
|
$unifont = "aegyptus";
|
|
break;
|
|
CASE "ethi": // ETHIOPIC
|
|
$unifont = "abyssinicasil";
|
|
break;
|
|
//CASE "merc": // MEROITIC_CURSIVE
|
|
//CASE "mero": // MEROITIC_HIEROGLYPHS
|
|
CASE "osma": // OSMANYA
|
|
$unifont = "mph2bdamase";
|
|
break;
|
|
CASE "tfng": // TIFINAGH
|
|
$unifont = "dejavusans";
|
|
break;
|
|
|
|
/* Middle Eastern */
|
|
CASE "arab": // ARABIC
|
|
$unifont = "xbriyaz";
|
|
break;
|
|
CASE "xsux": // CUNEIFORM
|
|
$unifont = "akkadian";
|
|
break;
|
|
//CASE "sarb": // OLD_SOUTH_ARABIAN
|
|
//CASE "prti": // INSCRIPTIONAL_PARTHIAN
|
|
//CASE "phli": // INSCRIPTIONAL_PAHLAVI
|
|
|
|
|
|
/* Central Asian */
|
|
//CASE "orkh": // OLD_TURKIC
|
|
//CASE "phag": // PHAGS_PA (Vertical script)
|
|
|
|
/* South Asian */
|
|
//CASE "brah": // BRAHMI
|
|
//CASE "kthi": // KAITHI
|
|
CASE "khar": // KHAROSHTHI
|
|
$unifont = "mph2bdamase";
|
|
break;
|
|
CASE "mtei": // MEETEI_MAYEK
|
|
$unifont = "eeyekunicode";
|
|
break;
|
|
//CASE "shrd": // SHARADA
|
|
//CASE "sora": // SORA_SOMPENG
|
|
|
|
/* South East Asian */
|
|
CASE "kali": // KAYAH_LI
|
|
$unifont = "freemono";
|
|
break;
|
|
//CASE "rjng": // REJANG
|
|
CASE "lana": // TAI_THAM
|
|
$unifont = "lannaalif";
|
|
break;
|
|
CASE "talu": // NEW_TAI_LUE
|
|
$unifont = "daibannasilbook";
|
|
break;
|
|
|
|
/* East Asian */
|
|
CASE "hans": // HAN (SIMPLIFIED)
|
|
if ($adobeCJK) {
|
|
$unifont = "gb";
|
|
} else {
|
|
$unifont = "sun-exta";
|
|
}
|
|
break;
|
|
CASE "bopo": // BOPOMOFO
|
|
$unifont = "sun-exta";
|
|
break;
|
|
//CASE "plrd": // MIAO
|
|
CASE "yiii": // YI
|
|
$unifont = "sun-exta";
|
|
break;
|
|
|
|
/* American */
|
|
CASE "dsrt": // DESERET
|
|
$unifont = "mph2bdamase";
|
|
break;
|
|
|
|
/* Other */
|
|
CASE "brai": // BRAILLE
|
|
$unifont = "dejavusans";
|
|
break;
|
|
} // endswitch
|
|
break;
|
|
} // endswitch
|
|
|
|
|
|
return array($coreSuitable, $unifont);
|
|
}
|