Source

Locale.js

  1. /*
  2. * Locale.js - Locale specifier definition
  3. *
  4. * Copyright © 2012-2015, 2018,2021 JEDLSoft
  5. *
  6. * Licensed under the Apache License, Version 2.0 (the "License");
  7. * you may not use this file except in compliance with the License.
  8. * You may obtain a copy of the License at
  9. *
  10. * http://www.apache.org/licenses/LICENSE-2.0
  11. *
  12. * Unless required by applicable law or agreed to in writing, software
  13. * distributed under the License is distributed on an "AS IS" BASIS,
  14. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  15. *
  16. * See the License for the specific language governing permissions and
  17. * limitations under the License.
  18. */
  19. var ilib = require("./ilib.js");
  20. var JSUtils = require("./JSUtils.js");
  21. /**
  22. * @class
  23. * Create a new locale instance. Locales are specified either with a specifier string
  24. * that follows the BCP-47 convention (roughly: "language-region-script-variant") or
  25. * with 4 parameters that specify the language, region, variant, and script individually.<p>
  26. *
  27. * The language is given as an ISO 639-1 two-letter, lower-case language code. You
  28. * can find a full list of these codes at
  29. * <a href="http://en.wikipedia.org/wiki/List_of_ISO_639-1_codes">http://en.wikipedia.org/wiki/List_of_ISO_639-1_codes</a><p>
  30. *
  31. * The region is given as an ISO 3166-1 two-letter, upper-case region code. You can
  32. * find a full list of these codes at
  33. * <a href="http://en.wikipedia.org/wiki/ISO_3166-1_alpha-2">http://en.wikipedia.org/wiki/ISO_3166-1_alpha-2</a>.<p>
  34. *
  35. * The variant is any string that does not contain a dash which further differentiates
  36. * locales from each other.<p>
  37. *
  38. * The script is given as the ISO 15924 four-letter script code. In some locales,
  39. * text may be validly written in more than one script. For example, Serbian is often
  40. * written in both Latin and Cyrillic, though not usually mixed together. You can find a
  41. * full list of these codes at
  42. * <a href="http://en.wikipedia.org/wiki/ISO_15924#List_of_codes">http://en.wikipedia.org/wiki/ISO_15924#List_of_codes</a>.<p>
  43. *
  44. * As an example in ilib, the script can be used in the date formatter. Dates formatted
  45. * in Serbian could have day-of-week names or month names written in the Latin
  46. * or Cyrillic script. Often one script is default such that sr-SR-Latn is the same
  47. * as sr-SR so the script code "Latn" can be left off of the locale spec.<p>
  48. *
  49. * Each part is optional, and an empty string in the specifier before or after a
  50. * dash or as a parameter to the constructor denotes an unspecified value. In this
  51. * case, many of the ilib functions will treat the locale as generic. For example
  52. * the locale "en-" is equivalent to "en" and to "en--" and denotes a locale
  53. * of "English" with an unspecified region and variant, which typically matches
  54. * any region or variant.<p>
  55. *
  56. * Without any arguments to the constructor, this function returns the locale of
  57. * the host Javascript engine.<p>
  58. *
  59. *
  60. * @constructor
  61. * @param {?string|Locale=} language the ISO 639 2-letter code for the language, or a full
  62. * locale spec in BCP-47 format, or another Locale instance to copy from
  63. * @param {string=} region the ISO 3166 2-letter code for the region
  64. * @param {string=} variant the name of the variant of this locale, if any
  65. * @param {string=} script the ISO 15924 code of the script for this locale, if any
  66. */
  67. var Locale = function(language, region, variant, script) {
  68. if (typeof(region) === 'undefined' && typeof(variant) === 'undefined' && typeof(script) === 'undefined') {
  69. var spec = language || ilib.getLocale();
  70. if (typeof(spec) === 'string') {
  71. var parts = spec.split(/[-_]/g);
  72. for ( var i = 0; i < parts.length; i++ ) {
  73. if (Locale._isLanguageCode(parts[i])) {
  74. /**
  75. * @private
  76. * @type {string|undefined}
  77. */
  78. this.language = parts[i];
  79. } else if (Locale._isRegionCode(parts[i])) {
  80. /**
  81. * @private
  82. * @type {string|undefined}
  83. */
  84. this.region = parts[i];
  85. } else if (Locale._isScriptCode(parts[i])) {
  86. /**
  87. * @private
  88. * @type {string|undefined}
  89. */
  90. this.script = parts[i];
  91. } else {
  92. /**
  93. * @private
  94. * @type {string|undefined}
  95. */
  96. this.variant = parts[i];
  97. }
  98. }
  99. this.language = this.language || undefined;
  100. this.region = this.region || undefined;
  101. this.script = this.script || undefined;
  102. this.variant = this.variant || undefined;
  103. } else if (typeof(spec) === 'object') {
  104. this.language = spec.language || undefined;
  105. this.region = spec.region || undefined;
  106. this.script = spec.script || undefined;
  107. this.variant = spec.variant || undefined;
  108. }
  109. } else {
  110. if (language && typeof(language) === "string") {
  111. language = language.trim();
  112. this.language = language.length > 0 ? language.toLowerCase() : undefined;
  113. } else {
  114. this.language = undefined;
  115. }
  116. if (region && typeof(region) === "string") {
  117. region = region.trim();
  118. this.region = region.length > 0 ? region.toUpperCase() : undefined;
  119. } else {
  120. this.region = undefined;
  121. }
  122. if (variant && typeof(variant) === "string") {
  123. variant = variant.trim();
  124. this.variant = variant.length > 0 ? variant : undefined;
  125. } else {
  126. this.variant = undefined;
  127. }
  128. if (script && typeof(script) === "string") {
  129. script = script.trim();
  130. this.script = script.length > 0 ? script : undefined;
  131. } else {
  132. this.script = undefined;
  133. }
  134. }
  135. this._genSpec();
  136. };
  137. // from http://en.wikipedia.org/wiki/ISO_3166-1
  138. Locale.a2toa3regmap = {
  139. "AF": "AFG",
  140. "AX": "ALA",
  141. "AL": "ALB",
  142. "DZ": "DZA",
  143. "AS": "ASM",
  144. "AD": "AND",
  145. "AO": "AGO",
  146. "AI": "AIA",
  147. "AQ": "ATA",
  148. "AG": "ATG",
  149. "AR": "ARG",
  150. "AM": "ARM",
  151. "AW": "ABW",
  152. "AU": "AUS",
  153. "AT": "AUT",
  154. "AZ": "AZE",
  155. "BS": "BHS",
  156. "BH": "BHR",
  157. "BD": "BGD",
  158. "BB": "BRB",
  159. "BY": "BLR",
  160. "BE": "BEL",
  161. "BZ": "BLZ",
  162. "BJ": "BEN",
  163. "BM": "BMU",
  164. "BT": "BTN",
  165. "BO": "BOL",
  166. "BQ": "BES",
  167. "BA": "BIH",
  168. "BW": "BWA",
  169. "BV": "BVT",
  170. "BR": "BRA",
  171. "IO": "IOT",
  172. "BN": "BRN",
  173. "BG": "BGR",
  174. "BF": "BFA",
  175. "BI": "BDI",
  176. "KH": "KHM",
  177. "CM": "CMR",
  178. "CA": "CAN",
  179. "CV": "CPV",
  180. "KY": "CYM",
  181. "CF": "CAF",
  182. "TD": "TCD",
  183. "CL": "CHL",
  184. "CN": "CHN",
  185. "CX": "CXR",
  186. "CC": "CCK",
  187. "CO": "COL",
  188. "KM": "COM",
  189. "CG": "COG",
  190. "CD": "COD",
  191. "CK": "COK",
  192. "CR": "CRI",
  193. "CI": "CIV",
  194. "HR": "HRV",
  195. "CU": "CUB",
  196. "CW": "CUW",
  197. "CY": "CYP",
  198. "CZ": "CZE",
  199. "DK": "DNK",
  200. "DJ": "DJI",
  201. "DM": "DMA",
  202. "DO": "DOM",
  203. "EC": "ECU",
  204. "EG": "EGY",
  205. "SV": "SLV",
  206. "GQ": "GNQ",
  207. "ER": "ERI",
  208. "EE": "EST",
  209. "ET": "ETH",
  210. "FK": "FLK",
  211. "FO": "FRO",
  212. "FJ": "FJI",
  213. "FI": "FIN",
  214. "FR": "FRA",
  215. "GF": "GUF",
  216. "PF": "PYF",
  217. "TF": "ATF",
  218. "GA": "GAB",
  219. "GM": "GMB",
  220. "GE": "GEO",
  221. "DE": "DEU",
  222. "GH": "GHA",
  223. "GI": "GIB",
  224. "GR": "GRC",
  225. "GL": "GRL",
  226. "GD": "GRD",
  227. "GP": "GLP",
  228. "GU": "GUM",
  229. "GT": "GTM",
  230. "GG": "GGY",
  231. "GN": "GIN",
  232. "GW": "GNB",
  233. "GY": "GUY",
  234. "HT": "HTI",
  235. "HM": "HMD",
  236. "VA": "VAT",
  237. "HN": "HND",
  238. "HK": "HKG",
  239. "HU": "HUN",
  240. "IS": "ISL",
  241. "IN": "IND",
  242. "ID": "IDN",
  243. "IR": "IRN",
  244. "IQ": "IRQ",
  245. "IE": "IRL",
  246. "IM": "IMN",
  247. "IL": "ISR",
  248. "IT": "ITA",
  249. "JM": "JAM",
  250. "JP": "JPN",
  251. "JE": "JEY",
  252. "JO": "JOR",
  253. "KZ": "KAZ",
  254. "KE": "KEN",
  255. "KI": "KIR",
  256. "KP": "PRK",
  257. "KR": "KOR",
  258. "KW": "KWT",
  259. "KG": "KGZ",
  260. "LA": "LAO",
  261. "LV": "LVA",
  262. "LB": "LBN",
  263. "LS": "LSO",
  264. "LR": "LBR",
  265. "LY": "LBY",
  266. "LI": "LIE",
  267. "LT": "LTU",
  268. "LU": "LUX",
  269. "MO": "MAC",
  270. "MK": "MKD",
  271. "MG": "MDG",
  272. "MW": "MWI",
  273. "MY": "MYS",
  274. "MV": "MDV",
  275. "ML": "MLI",
  276. "MT": "MLT",
  277. "MH": "MHL",
  278. "MQ": "MTQ",
  279. "MR": "MRT",
  280. "MU": "MUS",
  281. "YT": "MYT",
  282. "MX": "MEX",
  283. "FM": "FSM",
  284. "MD": "MDA",
  285. "MC": "MCO",
  286. "MN": "MNG",
  287. "ME": "MNE",
  288. "MS": "MSR",
  289. "MA": "MAR",
  290. "MZ": "MOZ",
  291. "MM": "MMR",
  292. "NA": "NAM",
  293. "NR": "NRU",
  294. "NP": "NPL",
  295. "NL": "NLD",
  296. "NC": "NCL",
  297. "NZ": "NZL",
  298. "NI": "NIC",
  299. "NE": "NER",
  300. "NG": "NGA",
  301. "NU": "NIU",
  302. "NF": "NFK",
  303. "MP": "MNP",
  304. "NO": "NOR",
  305. "OM": "OMN",
  306. "PK": "PAK",
  307. "PW": "PLW",
  308. "PS": "PSE",
  309. "PA": "PAN",
  310. "PG": "PNG",
  311. "PY": "PRY",
  312. "PE": "PER",
  313. "PH": "PHL",
  314. "PN": "PCN",
  315. "PL": "POL",
  316. "PT": "PRT",
  317. "PR": "PRI",
  318. "QA": "QAT",
  319. "RE": "REU",
  320. "RO": "ROU",
  321. "RU": "RUS",
  322. "RW": "RWA",
  323. "BL": "BLM",
  324. "SH": "SHN",
  325. "KN": "KNA",
  326. "LC": "LCA",
  327. "MF": "MAF",
  328. "PM": "SPM",
  329. "VC": "VCT",
  330. "WS": "WSM",
  331. "SM": "SMR",
  332. "ST": "STP",
  333. "SA": "SAU",
  334. "SN": "SEN",
  335. "RS": "SRB",
  336. "SC": "SYC",
  337. "SL": "SLE",
  338. "SG": "SGP",
  339. "SX": "SXM",
  340. "SK": "SVK",
  341. "SI": "SVN",
  342. "SB": "SLB",
  343. "SO": "SOM",
  344. "ZA": "ZAF",
  345. "GS": "SGS",
  346. "SS": "SSD",
  347. "ES": "ESP",
  348. "LK": "LKA",
  349. "SD": "SDN",
  350. "SR": "SUR",
  351. "SJ": "SJM",
  352. "SZ": "SWZ",
  353. "SE": "SWE",
  354. "CH": "CHE",
  355. "SY": "SYR",
  356. "TW": "TWN",
  357. "TJ": "TJK",
  358. "TZ": "TZA",
  359. "TH": "THA",
  360. "TL": "TLS",
  361. "TG": "TGO",
  362. "TK": "TKL",
  363. "TO": "TON",
  364. "TT": "TTO",
  365. "TN": "TUN",
  366. "TR": "TUR",
  367. "TM": "TKM",
  368. "TC": "TCA",
  369. "TV": "TUV",
  370. "UG": "UGA",
  371. "UA": "UKR",
  372. "AE": "ARE",
  373. "GB": "GBR",
  374. "US": "USA",
  375. "UM": "UMI",
  376. "UY": "URY",
  377. "UZ": "UZB",
  378. "VU": "VUT",
  379. "VE": "VEN",
  380. "VN": "VNM",
  381. "VG": "VGB",
  382. "VI": "VIR",
  383. "WF": "WLF",
  384. "EH": "ESH",
  385. "YE": "YEM",
  386. "ZM": "ZMB",
  387. "ZW": "ZWE"
  388. };
  389. Locale.a1toa3langmap = {
  390. "ab": "abk",
  391. "aa": "aar",
  392. "af": "afr",
  393. "ak": "aka",
  394. "sq": "sqi",
  395. "am": "amh",
  396. "ar": "ara",
  397. "an": "arg",
  398. "hy": "hye",
  399. "as": "asm",
  400. "av": "ava",
  401. "ae": "ave",
  402. "ay": "aym",
  403. "az": "aze",
  404. "bm": "bam",
  405. "ba": "bak",
  406. "eu": "eus",
  407. "be": "bel",
  408. "bn": "ben",
  409. "bh": "bih",
  410. "bi": "bis",
  411. "bs": "bos",
  412. "br": "bre",
  413. "bg": "bul",
  414. "my": "mya",
  415. "ca": "cat",
  416. "ch": "cha",
  417. "ce": "che",
  418. "ny": "nya",
  419. "zh": "zho",
  420. "cv": "chv",
  421. "kw": "cor",
  422. "co": "cos",
  423. "cr": "cre",
  424. "hr": "hrv",
  425. "cs": "ces",
  426. "da": "dan",
  427. "dv": "div",
  428. "nl": "nld",
  429. "dz": "dzo",
  430. "en": "eng",
  431. "eo": "epo",
  432. "et": "est",
  433. "ee": "ewe",
  434. "fo": "fao",
  435. "fj": "fij",
  436. "fi": "fin",
  437. "fr": "fra",
  438. "ff": "ful",
  439. "gl": "glg",
  440. "ka": "kat",
  441. "de": "deu",
  442. "el": "ell",
  443. "gn": "grn",
  444. "gu": "guj",
  445. "ht": "hat",
  446. "ha": "hau",
  447. "he": "heb",
  448. "hz": "her",
  449. "hi": "hin",
  450. "ho": "hmo",
  451. "hu": "hun",
  452. "ia": "ina",
  453. "id": "ind",
  454. "ie": "ile",
  455. "ga": "gle",
  456. "ig": "ibo",
  457. "ik": "ipk",
  458. "io": "ido",
  459. "is": "isl",
  460. "it": "ita",
  461. "iu": "iku",
  462. "ja": "jpn",
  463. "jv": "jav",
  464. "kl": "kal",
  465. "kn": "kan",
  466. "kr": "kau",
  467. "ks": "kas",
  468. "kk": "kaz",
  469. "km": "khm",
  470. "ki": "kik",
  471. "rw": "kin",
  472. "ky": "kir",
  473. "kv": "kom",
  474. "kg": "kon",
  475. "ko": "kor",
  476. "ku": "kur",
  477. "kj": "kua",
  478. "la": "lat",
  479. "lb": "ltz",
  480. "lg": "lug",
  481. "li": "lim",
  482. "ln": "lin",
  483. "lo": "lao",
  484. "lt": "lit",
  485. "lu": "lub",
  486. "lv": "lav",
  487. "gv": "glv",
  488. "mk": "mkd",
  489. "mg": "mlg",
  490. "ms": "msa",
  491. "ml": "mal",
  492. "mt": "mlt",
  493. "mi": "mri",
  494. "mr": "mar",
  495. "mh": "mah",
  496. "mn": "mon",
  497. "na": "nau",
  498. "nv": "nav",
  499. "nb": "nob",
  500. "nd": "nde",
  501. "ne": "nep",
  502. "ng": "ndo",
  503. "nn": "nno",
  504. "no": "nor",
  505. "ii": "iii",
  506. "nr": "nbl",
  507. "oc": "oci",
  508. "oj": "oji",
  509. "cu": "chu",
  510. "om": "orm",
  511. "or": "ori",
  512. "os": "oss",
  513. "pa": "pan",
  514. "pi": "pli",
  515. "fa": "fas",
  516. "pl": "pol",
  517. "ps": "pus",
  518. "pt": "por",
  519. "qu": "que",
  520. "rm": "roh",
  521. "rn": "run",
  522. "ro": "ron",
  523. "ru": "rus",
  524. "sa": "san",
  525. "sc": "srd",
  526. "sd": "snd",
  527. "se": "sme",
  528. "sm": "smo",
  529. "sg": "sag",
  530. "sr": "srp",
  531. "gd": "gla",
  532. "sn": "sna",
  533. "si": "sin",
  534. "sk": "slk",
  535. "sl": "slv",
  536. "so": "som",
  537. "st": "sot",
  538. "es": "spa",
  539. "su": "sun",
  540. "sw": "swa",
  541. "ss": "ssw",
  542. "sv": "swe",
  543. "ta": "tam",
  544. "te": "tel",
  545. "tg": "tgk",
  546. "th": "tha",
  547. "ti": "tir",
  548. "bo": "bod",
  549. "tk": "tuk",
  550. "tl": "tgl",
  551. "tn": "tsn",
  552. "to": "ton",
  553. "tr": "tur",
  554. "ts": "tso",
  555. "tt": "tat",
  556. "tw": "twi",
  557. "ty": "tah",
  558. "ug": "uig",
  559. "uk": "ukr",
  560. "ur": "urd",
  561. "uz": "uzb",
  562. "ve": "ven",
  563. "vi": "vie",
  564. "vo": "vol",
  565. "wa": "wln",
  566. "cy": "cym",
  567. "wo": "wol",
  568. "fy": "fry",
  569. "xh": "xho",
  570. "yi": "yid",
  571. "yo": "yor",
  572. "za": "zha",
  573. "zu": "zul"
  574. };
  575. // the list below is originally from https://unicode.org/iso15924/iso15924-codes.html
  576. Locale.iso15924 = [
  577. "Adlm",
  578. "Afak",
  579. "Aghb",
  580. "Ahom",
  581. "Arab",
  582. "Aran",
  583. "Armi",
  584. "Armn",
  585. "Avst",
  586. "Bali",
  587. "Bamu",
  588. "Bass",
  589. "Batk",
  590. "Beng",
  591. "Bhks",
  592. "Blis",
  593. "Bopo",
  594. "Brah",
  595. "Brai",
  596. "Bugi",
  597. "Buhd",
  598. "Cakm",
  599. "Cans",
  600. "Cari",
  601. "Cham",
  602. "Cher",
  603. "Chrs",
  604. "Cirt",
  605. "Copt",
  606. "Cpmn",
  607. "Cprt",
  608. "Cyrl",
  609. "Cyrs",
  610. "Deva",
  611. "Diak",
  612. "Dogr",
  613. "Dsrt",
  614. "Dupl",
  615. "Egyd",
  616. "Egyh",
  617. "Egyp",
  618. "Elba",
  619. "Elym",
  620. "Ethi",
  621. "Geok",
  622. "Geor",
  623. "Glag",
  624. "Gong",
  625. "Gonm",
  626. "Goth",
  627. "Gran",
  628. "Grek",
  629. "Gujr",
  630. "Guru",
  631. "Hanb",
  632. "Hang",
  633. "Hani",
  634. "Hano",
  635. "Hans",
  636. "Hant",
  637. "Hatr",
  638. "Hebr",
  639. "Hira",
  640. "Hluw",
  641. "Hmng",
  642. "Hmnp",
  643. "Hrkt",
  644. "Hung",
  645. "Inds",
  646. "Ital",
  647. "Jamo",
  648. "Java",
  649. "Jpan",
  650. "Jurc",
  651. "Kali",
  652. "Kana",
  653. "Khar",
  654. "Khmr",
  655. "Khoj",
  656. "Kitl",
  657. "Kits",
  658. "Knda",
  659. "Kore",
  660. "Kpel",
  661. "Kthi",
  662. "Lana",
  663. "Laoo",
  664. "Latf",
  665. "Latg",
  666. "Latn",
  667. "Leke",
  668. "Lepc",
  669. "Limb",
  670. "Lina",
  671. "Linb",
  672. "Lisu",
  673. "Loma",
  674. "Lyci",
  675. "Lydi",
  676. "Mahj",
  677. "Maka",
  678. "Mand",
  679. "Mani",
  680. "Marc",
  681. "Maya",
  682. "Medf",
  683. "Mend",
  684. "Merc",
  685. "Mero",
  686. "Mlym",
  687. "Modi",
  688. "Mong",
  689. "Moon",
  690. "Mroo",
  691. "Mtei",
  692. "Mult",
  693. "Mymr",
  694. "Nand",
  695. "Narb",
  696. "Nbat",
  697. "Newa",
  698. "Nkdb",
  699. "Nkgb",
  700. "Nkoo",
  701. "Nshu",
  702. "Ogam",
  703. "Olck",
  704. "Orkh",
  705. "Orya",
  706. "Osge",
  707. "Osma",
  708. "Palm",
  709. "Pauc",
  710. "Perm",
  711. "Phag",
  712. "Phli",
  713. "Phlp",
  714. "Phlv",
  715. "Phnx",
  716. "Plrd",
  717. "Piqd",
  718. "Prti",
  719. "Qaaa",
  720. "Qabx",
  721. "Rjng",
  722. "Rohg",
  723. "Roro",
  724. "Runr",
  725. "Samr",
  726. "Sara",
  727. "Sarb",
  728. "Saur",
  729. "Sgnw",
  730. "Shaw",
  731. "Shrd",
  732. "Shui",
  733. "Sidd",
  734. "Sind",
  735. "Sinh",
  736. "Sogd",
  737. "Sogo",
  738. "Sora",
  739. "Soyo",
  740. "Sund",
  741. "Sylo",
  742. "Syrc",
  743. "Syre",
  744. "Syrj",
  745. "Syrn",
  746. "Tagb",
  747. "Takr",
  748. "Tale",
  749. "Talu",
  750. "Taml",
  751. "Tang",
  752. "Tavt",
  753. "Telu",
  754. "Teng",
  755. "Tfng",
  756. "Tglg",
  757. "Thaa",
  758. "Thai",
  759. "Tibt",
  760. "Tirh",
  761. "Toto",
  762. "Ugar",
  763. "Vaii",
  764. "Visp",
  765. "Wara",
  766. "Wcho",
  767. "Wole",
  768. "Xpeo",
  769. "Xsux",
  770. "Yezi",
  771. "Yiii",
  772. "Zanb",
  773. "Zinh",
  774. "Zmth",
  775. "Zsye",
  776. "Zsym",
  777. "Zxxx",
  778. "Zyyy",
  779. "Zzzz",
  780. ];
  781. /**
  782. * Tell whether or not the str does not start with a lower case ASCII char.
  783. * @private
  784. * @param {string} str the char to check
  785. * @return {boolean} true if the char is not a lower case ASCII char
  786. */
  787. Locale._notLower = function(str) {
  788. // do this with ASCII only so we don't have to depend on the CType functions
  789. var ch = str.charCodeAt(0);
  790. return ch < 97 || ch > 122;
  791. };
  792. /**
  793. * Tell whether or not the str does not start with an upper case ASCII char.
  794. * @private
  795. * @param {string} str the char to check
  796. * @return {boolean} true if the char is a not an upper case ASCII char
  797. */
  798. Locale._notUpper = function(str) {
  799. // do this with ASCII only so we don't have to depend on the CType functions
  800. var ch = str.charCodeAt(0);
  801. return ch < 65 || ch > 90;
  802. };
  803. /**
  804. * Tell whether or not the str does not start with a digit char.
  805. * @private
  806. * @param {string} str the char to check
  807. * @return {boolean} true if the char is a not an upper case ASCII char
  808. */
  809. Locale._notDigit = function(str) {
  810. // do this with ASCII only so we don't have to depend on the CType functions
  811. var ch = str.charCodeAt(0);
  812. return ch < 48 || ch > 57;
  813. };
  814. /**
  815. * Tell whether or not the given string has the correct syntax to be
  816. * an ISO 639 language code.
  817. *
  818. * @private
  819. * @param {string} str the string to parse
  820. * @return {boolean} true if the string could syntactically be a language code.
  821. */
  822. Locale._isLanguageCode = function(str) {
  823. if (typeof(str) === 'undefined' || str.length < 2 || str.length > 3) {
  824. return false;
  825. }
  826. for (var i = 0; i < str.length; i++) {
  827. if (Locale._notLower(str.charAt(i))) {
  828. return false;
  829. }
  830. }
  831. return true;
  832. };
  833. /**
  834. * Tell whether or not the given string has the correct syntax to be
  835. * an ISO 3166 2-letter region code or M.49 3-digit region code.
  836. *
  837. * @private
  838. * @param {string} str the string to parse
  839. * @return {boolean} true if the string could syntactically be a language code.
  840. */
  841. Locale._isRegionCode = function (str) {
  842. var i;
  843. if (typeof(str) === 'undefined' || str.length < 2 || str.length > 3) {
  844. return false;
  845. }
  846. if (str.length === 2) {
  847. for (i = 0; i < str.length; i++) {
  848. if (Locale._notUpper(str.charAt(i))) {
  849. return false;
  850. }
  851. }
  852. } else {
  853. for (i = 0; i < str.length; i++) {
  854. if (Locale._notDigit(str.charAt(i))) {
  855. return false;
  856. }
  857. }
  858. }
  859. return true;
  860. };
  861. /**
  862. * Tell whether or not the given string has the correct syntax to be
  863. * an ISO 639 language code.
  864. *
  865. * @private
  866. * @param {string} str the string to parse
  867. * @return {boolean} true if the string could syntactically be a language code.
  868. */
  869. Locale._isScriptCode = function(str) {
  870. if (typeof(str) === 'undefined' || str.length !== 4 || Locale._notUpper(str.charAt(0))) {
  871. return false;
  872. }
  873. for (var i = 1; i < 4; i++) {
  874. if (Locale._notLower(str.charAt(i))) {
  875. return false;
  876. }
  877. }
  878. return true;
  879. };
  880. /**
  881. * Return the ISO-3166 alpha3 equivalent region code for the given ISO 3166 alpha2
  882. * region code. If the given alpha2 code is not found, this function returns its
  883. * argument unchanged.
  884. * @static
  885. * @param {string|undefined} alpha2 the alpha2 code to map
  886. * @return {string|undefined} the alpha3 equivalent of the given alpha2 code, or the alpha2
  887. * parameter if the alpha2 value is not found
  888. */
  889. Locale.regionAlpha2ToAlpha3 = function(alpha2) {
  890. return Locale.a2toa3regmap[alpha2] || alpha2;
  891. };
  892. /**
  893. * Return the ISO-639 alpha3 equivalent language code for the given ISO 639 alpha1
  894. * language code. If the given alpha1 code is not found, this function returns its
  895. * argument unchanged.
  896. * @static
  897. * @param {string|undefined} alpha1 the alpha1 code to map
  898. * @return {string|undefined} the alpha3 equivalent of the given alpha1 code, or the alpha1
  899. * parameter if the alpha1 value is not found
  900. */
  901. Locale.languageAlpha1ToAlpha3 = function(alpha1) {
  902. return Locale.a1toa3langmap[alpha1] || alpha1;
  903. };
  904. Locale.prototype = {
  905. /**
  906. * @private
  907. */
  908. _genSpec: function () {
  909. this.spec = this.language || "";
  910. if (this.script) {
  911. if (this.spec.length > 0) {
  912. this.spec += "-";
  913. }
  914. this.spec += this.script;
  915. }
  916. if (this.region) {
  917. if (this.spec.length > 0) {
  918. this.spec += "-";
  919. }
  920. this.spec += this.region;
  921. }
  922. if (this.variant) {
  923. if (this.spec.length > 0) {
  924. this.spec += "-";
  925. }
  926. this.spec += this.variant;
  927. }
  928. },
  929. /**
  930. * Return the ISO 639 language code for this locale.
  931. * @return {string|undefined} the language code for this locale
  932. */
  933. getLanguage: function() {
  934. return this.language;
  935. },
  936. /**
  937. * Return the language of this locale as an ISO-639-alpha3 language code
  938. * @return {string|undefined} the alpha3 language code of this locale
  939. */
  940. getLanguageAlpha3: function() {
  941. return Locale.languageAlpha1ToAlpha3(this.language);
  942. },
  943. /**
  944. * Return the ISO 3166 region code for this locale.
  945. * @return {string|undefined} the region code of this locale
  946. */
  947. getRegion: function() {
  948. return this.region;
  949. },
  950. /**
  951. * Return the region of this locale as an ISO-3166-alpha3 region code
  952. * @return {string|undefined} the alpha3 region code of this locale
  953. */
  954. getRegionAlpha3: function() {
  955. return Locale.regionAlpha2ToAlpha3(this.region);
  956. },
  957. /**
  958. * Return the ISO 15924 script code for this locale
  959. * @return {string|undefined} the script code of this locale
  960. */
  961. getScript: function () {
  962. return this.script;
  963. },
  964. /**
  965. * Return the variant code for this locale
  966. * @return {string|undefined} the variant code of this locale, if any
  967. */
  968. getVariant: function() {
  969. return this.variant;
  970. },
  971. /**
  972. * Return the whole locale specifier as a string.
  973. * @return {string} the locale specifier
  974. */
  975. getSpec: function() {
  976. if (!this.spec) this._genSpec();
  977. return this.spec;
  978. },
  979. /**
  980. * Return the language locale specifier. This includes the
  981. * language and the script if it is available. This can be
  982. * used to see whether the written language of two locales
  983. * match each other regardless of the region or variant.
  984. *
  985. * @return {string} the language locale specifier
  986. */
  987. getLangSpec: function() {
  988. var spec = this.language;
  989. if (spec && this.script) {
  990. spec += "-" + this.script;
  991. }
  992. return spec || "";
  993. },
  994. /**
  995. * Express this locale object as a string. Currently, this simply calls the getSpec
  996. * function to represent the locale as its specifier.
  997. *
  998. * @return {string} the locale specifier
  999. */
  1000. toString: function() {
  1001. return this.getSpec();
  1002. },
  1003. /**
  1004. * Return true if the the other locale is exactly equal to the current one.
  1005. * @return {boolean} whether or not the other locale is equal to the current one
  1006. */
  1007. equals: function(other) {
  1008. return this.language === other.language &&
  1009. this.region === other.region &&
  1010. this.script === other.script &&
  1011. this.variant === other.variant;
  1012. },
  1013. /**
  1014. * Return true if the current locale is the special pseudo locale.
  1015. * @return {boolean} true if the current locale is the special pseudo locale
  1016. */
  1017. isPseudo: function () {
  1018. return JSUtils.indexOf(ilib.pseudoLocales, this.spec) > -1;
  1019. },
  1020. /**
  1021. * Return true if the current locale uses a valid ISO codes for each component
  1022. * of the locale that exists.
  1023. * @return {boolean} true if the current locale has all valid components, and
  1024. * false otherwise.
  1025. */
  1026. isValid: function() {
  1027. if (!this.language && !this.script && !this.region) return false;
  1028. return !!((!this.language || (Locale._isLanguageCode(this.language) && Locale.a1toa3langmap[this.language])) &&
  1029. (!this.script || (Locale._isScriptCode(this.script) && Locale.iso15924.indexOf(this.script) > -1)) &&
  1030. (!this.region || (Locale._isRegionCode(this.region) && Locale.a2toa3regmap[this.region])));
  1031. }
  1032. };
  1033. // static functions
  1034. /**
  1035. * @private
  1036. */
  1037. Locale.locales = [];
  1038. // !macro localelist
  1039. /**
  1040. * Return the list of available locales that this iLib file supports.
  1041. * If this copy of ilib is pre-assembled with locale data, then the
  1042. * list locales may be much smaller
  1043. * than the list of all available locales in the iLib repository. The
  1044. * assembly tool will automatically fill in the list for an assembled
  1045. * copy of iLib. If this copy is being used with dynamically loaded
  1046. * data, then you
  1047. * can load any locale that iLib supports. You can form a locale with any
  1048. * combination of a language and region tags that exist in the locale
  1049. * data directory. Language tags are in the root of the locale data dir,
  1050. * and region tags can be found underneath the "und" directory. (The
  1051. * region tags are separated into a different dir because the region names
  1052. * conflict with language names on file systems that are case-insensitive.)
  1053. * If you have culled the locale data directory to limit the size of
  1054. * your app, then this function should return only those files that actually exist
  1055. * according to the ilibmanifest.json file in the root of that locale
  1056. * data dir. Make sure your ilibmanifest.json file is up-to-date with
  1057. * respect to the list of files that exist in the locale data dir.
  1058. *
  1059. * @param {boolean} sync if false, load the list of available files from disk
  1060. * asynchronously, otherwise load them synchronously. (Default: true/synchronously)
  1061. * @param {Function} onLoad a callback function to call if asynchronous
  1062. * load was requested and the list of files have been loaded.
  1063. * @return {Array.<string>} this is an array of locale specs for which
  1064. * this iLib file has locale data for
  1065. */
  1066. Locale.getAvailableLocales = function (sync, onLoad) {
  1067. var locales = [];
  1068. if (Locale.locales.length || typeof(ilib._load.listAvailableFiles) !== 'function') {
  1069. locales = Locale.locales;
  1070. if (onLoad && typeof(onLoad) === 'function') {
  1071. onLoad(locales);
  1072. }
  1073. } else {
  1074. if (typeof(sync) === 'undefined') {
  1075. sync = true;
  1076. }
  1077. ilib._load.listAvailableFiles(sync, function(manifest) {
  1078. if (manifest) {
  1079. for (var dir in manifest) {
  1080. var filelist = manifest[dir];
  1081. for (var i = 0; i < filelist.length; i++) {
  1082. if (filelist[i].length > 15 && filelist[i].substr(-15) === "localeinfo.json") {
  1083. locales.push(filelist[i].substring(0,filelist[i].length-16).replace(/\//g, "-"));
  1084. }
  1085. }
  1086. }
  1087. }
  1088. if (onLoad && typeof(onLoad) === 'function') {
  1089. onLoad(locales);
  1090. }
  1091. });
  1092. }
  1093. return locales;
  1094. };
  1095. module.exports = Locale;