Jump to content
Wikipedia The Free Encyclopedia

Module:Lang/data/is latn data

From Wikipedia, the free encyclopedia
Module documentation[view] [edit] [history] [purge]
Warning This Lua module is used on approximately 1,650,000 pages, or roughly 3% of all pages .
To avoid major disruption and server load, any changes should be tested in the module's /sandbox or /testcases subpages, or in your own module sandbox. The tested changes can be added to this page in a single edit. Consider discussing changes on the talk page before implementing them.

Usage

{{#invoke:Lang/data/is latn data|function_name}}

The above documentation is transcluded from Module:Lang/data/is latn data/doc. (edit | history)
Editors can experiment in this module's sandbox (create | mirror) and testcases (create) pages.
Subpages of this module.

 --[[--------------------------< S I N G L E S _ T >-----------------------------------------------------------

 list of Latn and Zyyy (common) codepoints that are not included in <ranges_t> taken from Module:Unicode data/scripts
 and a local copy of https://www.unicode.org/Public/16.0.0/ucd/ScriptExtensions.txt

 ]]

 localsingles_t={
 [170]=true,-- 00AA
 [186]=true,-- 00BA
 [215]=true,-- 00D7
 [247]=true,-- 00F7
 [787]=true,-- 0313
 [800]=true,-- 0320
 [856]=true,-- 0358
 [862]=true,-- 035E
 [884]=true,-- 0374
 [894]=true,-- 037E
 [901]=true,-- 0385
 [903]=true,-- 0387
 [1541]=true,-- 0605
 [1548]=true,-- 060C
 [1563]=true,-- 061B
 [1567]=true,-- 061F
 [1600]=true,-- 0640
 [1757]=true,-- 06DD
 [2274]=true,-- 08E2
 [3647]=true,-- 0E3F
 [4347]=true,-- 10FB
 [6149]=true,-- 1805
 [7379]=true,-- 1CD3
 [7393]=true,-- 1CE1
 [7418]=true,-- 1CFA
 [7672]=true,-- 1DF8
 [8305]=true,-- 2071
 [8319]=true,-- 207F
 [8432]=true,-- 20F0
 [8498]=true,-- 2132
 [8526]=true,-- 214E
 [12294]=true,-- 3006
 [12448]=true,-- 30A0
 [12783]=true,-- 31EF
 [13055]=true,-- 32FF
 [42963]=true,-- A7D3
 [43310]=true,-- A92E
 [43471]=true,-- A9CF
 [43867]=true,-- AB5B
 [65279]=true,-- FEFF
 [65392]=true,-- FF70
 [119970]=true,-- 1D4A2
 [119995]=true,-- 1D4BB
 [120134]=true,-- 1D546
 [129008]=true,-- 1F7F0
 [917505]=true,-- E0001
 }


 --[[--------------------------< R A N G E S _ T >-------------------------------------------------------------

 list of Latn and Zyyy (common) codepoints taken from Module:Unicode data/scripts and a local copy of
 https://www.unicode.org/Public/16.0.0/ucd/ScriptExtensions.txt

 ]]

 localranges_t={
 {0,169},-- 0000..00A9
 {171,185},-- 00AB..00B9
 {187,214},-- 00BB..00D6
 {216,246},-- 00D8..00F6
 {248,745},-- 00F8..02E9
 {748,782},-- 02EC..030E
 {784,785},-- 0310..0311
 {803,805},-- 0323..0325
 {813,814},-- 032D..032E
 {816,817},-- 0330..0331
 {867,879},-- 0363..036F
 {1157,1158},-- 0485..0486
 {2385,2386},-- 0951..0952
 {2404,2405},-- 0964..0965
 {4053,4056},-- 0FD5..0FD8
 {5867,5869},-- 16EB..16ED
 {5941,5942},-- 1735..1736
 {6146,6147},-- 1802..1803
 {7401,7404},-- 1CE9..1CEC
 {7406,7411},-- 1CEE..1CF3
 {7413,7415},-- 1CF5..1CF7
 {7424,7461},-- 1D00..1D25
 {7468,7516},-- 1D2C..1D5C
 {7522,7525},-- 1D62..1D65
 {7531,7543},-- 1D6B..1D77
 {7545,7614},-- 1D79..1DBE
 {7680,7935},-- 1E00..1EFF
 {8192,8203},-- 2000..200B
 {8206,8292},-- 200E..2064
 {8294,8304},-- 2066..2070
 {8308,8318},-- 2074..207E
 {8320,8334},-- 2080..208E
 {8336,8348},-- 2090..209C
 {8352,8384},-- 20A0..20C0
 {8448,8485},-- 2100..2125
 {8487,8497},-- 2127..2131
 {8499,8525},-- 2133..214D
 {8527,8587},-- 214F..218B
 {8592,9257},-- 2190..2429
 {9280,9290},-- 2440..244A
 {9312,10239},-- 2460..27FF
 {10496,11123},-- 2900..2B73
 {11126,11157},-- 2B76..2B95
 {11159,11263},-- 2B97..2BFF
 {11360,11391},-- 2C60..2C7F
 {11776,11869},-- 2E00..2E5D
 {12272,12292},-- 2FF0..3004
 {12296,12320},-- 3008..3020
 {12336,12343},-- 3030..3037
 {12348,12351},-- 303C..303F
 {12443,12444},-- 309B..309C
 {12539,12540},-- 30FB..30FC
 {12688,12703},-- 3190..319F
 {12736,12773},-- 31C0..31E5
 {12832,12895},-- 3220..325F
 {12927,13007},-- 327F..32CF
 {13144,13311},-- 3358..33FF
 {19904,19967},-- 4DC0..4DFF
 {42752,42957},-- A700..A7CD
 {42960,42961},-- A7D0..A7D1
 {42965,42972},-- A7D5..A7DC
 {42994,43007},-- A7F2..A7FF
 {43056,43065},-- A830..A839
 {43824,43866},-- AB30..AB5A
 {43868,43876},-- AB5C..AB64
 {43878,43883},-- AB66..AB6B
 {64256,64262},-- FB00..FB06
 {64830,64831},-- FD3E..FD3F
 {65040,65049},-- FE10..FE19
 {65072,65106},-- FE30..FE52
 {65108,65126},-- FE54..FE66
 {65128,65131},-- FE68..FE6B
 {65281,65381},-- FF01..FF65
 {65438,65439},-- FF9E..FF9F
 {65504,65510},-- FFE0..FFE6
 {65512,65518},-- FFE8..FFEE
 {65529,65533},-- FFF9..FFFD
 {65792,65794},-- 10100..10102
 {65799,65843},-- 10107..10133
 {65847,65855},-- 10137..1013F
 {65936,65948},-- 10190..1019C
 {66000,66044},-- 101D0..101FC
 {66273,66299},-- 102E1..102FB
 {67456,67461},-- 10780..10785
 {67463,67504},-- 10787..107B0
 {67506,67514},-- 107B2..107BA
 {113824,113827},-- 1BCA0..1BCA3
 {117760,118009},-- 1CC00..1CCF9
 {118016,118451},-- 1CD00..1CEB3
 {118608,118723},-- 1CF50..1CFC3
 {118784,119029},-- 1D000..1D0F5
 {119040,119078},-- 1D100..1D126
 {119081,119142},-- 1D129..1D166
 {119146,119162},-- 1D16A..1D17A
 {119171,119172},-- 1D183..1D184
 {119180,119209},-- 1D18C..1D1A9
 {119214,119274},-- 1D1AE..1D1EA
 {119488,119507},-- 1D2C0..1D2D3
 {119520,119539},-- 1D2E0..1D2F3
 {119552,119638},-- 1D300..1D356
 {119648,119672},-- 1D360..1D378
 {119808,119892},-- 1D400..1D454
 {119894,119964},-- 1D456..1D49C
 {119966,119967},-- 1D49E..1D49F
 {119973,119974},-- 1D4A5..1D4A6
 {119977,119980},-- 1D4A9..1D4AC
 {119982,119993},-- 1D4AE..1D4B9
 {119997,120003},-- 1D4BD..1D4C3
 {120005,120069},-- 1D4C5..1D505
 {120071,120074},-- 1D507..1D50A
 {120077,120084},-- 1D50D..1D514
 {120086,120092},-- 1D516..1D51C
 {120094,120121},-- 1D51E..1D539
 {120123,120126},-- 1D53B..1D53E
 {120128,120132},-- 1D540..1D544
 {120138,120144},-- 1D54A..1D550
 {120146,120485},-- 1D552..1D6A5
 {120488,120779},-- 1D6A8..1D7CB
 {120782,120831},-- 1D7CE..1D7FF
 {122624,122654},-- 1DF00..1DF1E
 {122661,122666},-- 1DF25..1DF2A
 {126065,126132},-- 1EC71..1ECB4
 {126209,126269},-- 1ED01..1ED3D
 {126976,127019},-- 1F000..1F02B
 {127024,127123},-- 1F030..1F093
 {127136,127150},-- 1F0A0..1F0AE
 {127153,127167},-- 1F0B1..1F0BF
 {127169,127183},-- 1F0C1..1F0CF
 {127185,127221},-- 1F0D1..1F0F5
 {127232,127405},-- 1F100..1F1AD
 {127462,127487},-- 1F1E6..1F1FF
 {127489,127490},-- 1F201..1F202
 {127504,127547},-- 1F210..1F23B
 {127552,127560},-- 1F240..1F248
 {127568,127569},-- 1F250..1F251
 {127584,127589},-- 1F260..1F265
 {127744,128727},-- 1F300..1F6D7
 {128732,128748},-- 1F6DC..1F6EC
 {128752,128764},-- 1F6F0..1F6FC
 {128768,128886},-- 1F700..1F776
 {128891,128985},-- 1F77B..1F7D9
 {128992,129003},-- 1F7E0..1F7EB
 {129024,129035},-- 1F800..1F80B
 {129040,129095},-- 1F810..1F847
 {129104,129113},-- 1F850..1F859
 {129120,129159},-- 1F860..1F887
 {129168,129197},-- 1F890..1F8AD
 {129200,129211},-- 1F8B0..1F8BB
 {129216,129217},-- 1F8C0..1F8C1
 {129280,129619},-- 1F900..1FA53
 {129632,129645},-- 1FA60..1FA6D
 {129648,129660},-- 1FA70..1FA7C
 {129664,129673},-- 1FA80..1FA89
 {129679,129734},-- 1FA8F..1FAC6
 {129742,129756},-- 1FACE..1FADC
 {129759,129769},-- 1FADF..1FAE9
 {129776,129784},-- 1FAF0..1FAF8
 {129792,129938},-- 1FB00..1FB92
 {129940,130041},-- 1FB94..1FBF9
 {917536,917631},-- E0020..E007F
 }


 --[[--------------------------< S P E C I A L S _ T >---------------------------------------------------------

 list of individual language-specific non-Latn and non-Zyyy codepoints; these codepoints commonly used in
 transliterations. This list is manually currated so is most likely incomplete.

 keys to <specials_t> are decimal codepoints; other keys are language tags (always lowercase) of language
 transliterations that use these non-Latn codepoints.

 ]]

 localspecials_t={
 [788]={-- U+0314: COMBINING REVERSED COMMA ABOVE
 ["hy"]=true,-- Armenian
 },
 [794]={-- U+031A: COMBINING LEFT ANGLE ABOVE
 ["ltc"]=true,-- Middle Chinese; is this really IPA?
 },
 [795]={-- U+031B: COMBINING HORN
 ["th"]=true,-- Thai
 },
 [806]={-- U+0326: COMBINING COMMA BELOW
 ["ab"]=true,-- Abkhaz
 ["kca"]=true,-- Khanty
 ["xal"]=true,-- Kalmyk or Oirat
 },
 [807]={-- U+0327: COMBINING CEDILLA
 ["fa"]=true,-- Persian
 },
 [809]={-- U+0329: COMBINING VERTICAL LINE BELOW
 ["ab"]=true,-- Abkhaz
 ["sa"]=true,-- Sanskrit
 },
 [815]={-- U+032F: COMBINING INVERTED BREVE BELOW
 ["mong"]=true,-- Mongolian
 ["xsc"]=true,-- Scythian
 },
 [818]={-- U+0332: COMBINING LOW LINE
 ["ar"]=true,-- Arabic
 ["hbo"]=true,-- Ancient Hebrew
 ["he"]=true,-- Hebrew
 ["jpa"]=true,-- Jewish Palestinian Aramaic
 ["mdh"]=true,-- Maguindanaon
 ["otk"]=true,-- Old Turkish
 },
 [831]={-- U+033F: COMBINING DOUBLE OVERLINE
 ["mnp"]=true,-- Northern Min Chinese, Jian'ou dialect
 },
 [855]={-- U+0357: COMBINING RIGHT HALF RING ABOVE
 ["egy"]=true,-- Ancient Egyptian
 },
 [863]={-- U+035F: COMBINING DOUBLE MACRON BELOW
 ["am"]=true,-- Amharic
 ["ar"]=true,-- Arabic
 ["dv"]=true,-- Dhivehi, Divehi, or Maldivian
 ["fa"]=true,-- Persian
 ["hi"]=true,-- Hindi
 ["inc"]=true,-- Indic languages
 ["ur"]=true,-- Urdu
 },
 [864]={-- U+0360: COMBINING DOUBLE TILDE
 ["hi"]=true,-- Hindi
 },
 [865]={-- U+0361: COMBINING DOUBLE INVERTED BREVE
 ["be"]=true,-- Belarusian
 ["ltc"]=true,-- Middle Chinese; is this really IPA?
 ["ru"]=true,-- Russian
 ["rue"]=true,-- Rusyn
 ["sem"]=true,-- Semitic languages
 ["sit"]=true,-- Sino-Tibetan languages
 ["tt"]=true,-- Tatar
 },
 [916]={-- U+0394: GREEK CAPITAL LETTER DELTA
 ["xsc"]=true,-- Scythian
 ["xsc-x-pontic"]=true,-- Pontic Scythian
 },
 [920]={-- U+0398: GREEK CAPITAL LETTER THETA
 ["ae"]=true,-- Avestan
 },
 [934]={-- U+03A6: GREEK CAPITAL LETTER PHI
 ["xle"]=true,-- Lemnian
 },
 [945]={-- U+03B1: GREEK SMALL LETTER ALPHA
 ["apc"]=true,-- Levantine Arabic
 },
 [946]={-- U+03B2: GREEK SMALL LETTER BETA
 ["ae"]=true,-- Avestan
 ["gha"]=true,-- Ghadamès
 ["ougr"]=true,-- Old Uyghur
 ["sem"]=true,-- Semitic languages
 ["syc"]=true,-- Classical Syriac
 ["wuu"]=true,-- Shanghainese variety of Wu Chinese
 },
 [947]={-- U+03B3: GREEK SMALL LETTER GAMMA
 ["ae"]=true,-- Avestan
 ["ltc"]=true,-- Late Middle Chinese
 ["mn"]=true,-- Mongolian
 ["och"]=true,-- Old Chinese
 ["ougr"]=true,-- Old Uyghur
 ["pal"]=true,-- Middle Persian
 ["syc"]=true,-- Classical Syriac
 ["syr"]=true,-- Syriac
 ["xal"]=true,-- Kalmyk or Oirat
 ["xng"]=true,-- Middle Mongolian
 ["xsc"]=true,-- Scythian
 ["ydg"]=true,-- Yidgha
 ["mong"]=true,-- Mongolian
 },
 [948]={-- U+03B4: GREEK SMALL LETTER DELTA
 ["ae"]=true,-- Avestan
 ["ougr"]=true,-- Old Uyghur
 ["sog"]=true,-- Sogdian
 ["sogd"]=true,-- Sogdian
 ["syc"]=true,-- Classical Syriac
 ["xpr"]=true,-- Parthian
 ["xsc"]=true,-- Scythian
 ["xsc-x-pontic"]=true,-- Pontic Scythian
 },
 [952]={-- U+03B8: GREEK SMALL LETTER THETA
 ["ae"]=true,-- Avestan
 ["ba"]=true,-- Bashkir
 ["cms"]=true,-- Messapic
 ["ett"]=true,-- Etruscan
 ["hur"]=true,-- Halkomelem
 ["ira"]=true,-- Iranian languages
 ["my"]=true,-- Burmese
 ["pal"]=true,-- Middle Persian (Pahlavi)
 ["peo"]=true,-- Old Persian
 ["sa"]=true,-- Sanskrit
 ["sem"]=true,-- Semitic languages
 ["syc"]=true,-- Classical Syriac
 ["syr"]=true,-- Syriac
 ["xme"]=true,-- Median
 ["xpg"]=true,-- Phrygian
 ["xpr"]=true,-- Parthian
 ["xsc"]=true,-- Scythian
 },
 [955]={-- U+03BB: GREEK SMALL LETTER LAMDA
 ["xcr"]=true,-- Carian
 ["xld"]=true,-- Lydian
 },
 [963]={-- U+03C3: GREEK SMALL LETTER SIGMA
 ["ett"]=true,-- Etruscan
 },
 [964]={-- U+03C4: GREEK SMALL LETTER TAU
 ["xld"]=true,-- Lydian
 },
 [966]={-- U+03C6: GREEK SMALL LETTER PHI
 ["ett"]=true,-- Etruscan
 },
 [967]={-- U+03C7: GREEK SMALL LETTER CHI
 ["ett"]=true,-- Etruscan
 ["gem"]=true,-- Germanic languages
 ["kbd"]=true,-- Kabardian
 ["ltc"]=true,-- Late Middle Chinese
 ["och"]=true,-- Old Chinese
 ["xlc"]=true,-- Lycian
 ["xle"]=true,-- Lemnian
 },
 [968]={-- U+03C8: GREEK SMALL LETTER PSI
 ["ett"]=true,-- Etruscan
 },
 [977]={-- U+03D1: GREEK THETA SYMBOL (cursive form)
 ["ae"]=true,-- Avestan
 ["ira"]=true,-- Iranian languages
 ["peo"]=true,-- Old Persian
 ["xme"]=true,-- Median
 ["xsc"]=true,-- Scythian
 ["xsc-x-pontic"]=true,-- Pontic Scythian
 },
 [1098]={-- U+044A: CYRILLIC SMALL LETTER HARD SIGN
 ["ady"]=true,-- Adyghe
 ["cu"]=true,-- Church Slavic
 ["zls"]=true,-- South Slavic languages
 },
 [1100]={-- U+044C: CYRILLIC SMALL LETTER SOFT SIGN
 ["az"]=true,-- Azerbaijani
 ["cu"]=true,-- Church Slavonic
 ["dng"]=true,-- Dungan
 ["ru"]=true,-- Russian
 ["tt"]=true,-- Tatar
 ["tyv"]=true,-- Tuvinian
 },
 [1278]={-- U+04FE: CYRILLIC CAPITAL LETTER HA WITH STROKE
 ["av"]=true,-- Avar
 },
 [1279]={-- U+04FF: CYRILLIC SMALL LETTER HA WITH STROKE
 ["av"]=true,-- Avar
 },
 [8113]={-- U+1FB1: GREEK SMALL LETTER ALPHA WITH MACRON
 ["apc"]=true,-- Levantine Arabic
 },
 [8190]={-- U+1FFE: GREEK DASIA
 ["ar"]=true,-- Arabic (Ayin)
 ["xcl"]=true,-- Classical Armenian
 },
 [19978]={-- U+4E0A: [CJK Unified Ideographs]
 ["wuu"]=true,-- Wu Chinese tone marker
 },
 [20837]={-- U+5165: [CJK Unified Ideographs]
 ["wuu"]=true,-- Wu Chinese tone marker
 },
 [21435]={-- U+53BB: [CJK Unified Ideographs]
 ["wuu"]=true,-- Wu Chinese tone marker
 },
 [24179]={-- U+5E73: [CJK Unified Ideographs]
 ["wuu"]=true,-- Wu Chinese tone marker
 },
 [38451]={-- U+9633: [CJK Unified Ideographs] (Yang)
 ["wuu"]=true,-- Suzhou dialect of Wu Chinese tone marker --[[Suzhou dialect#Tones]]
 },
 [38452]={-- U+9634: [CJK Unified Ideographs] (Yin)
 ["wuu"]=true,-- Suzhou dialect of Wu Chinese tone marker --[[Suzhou dialect#Tones]]
 },
 [65056]={-- U+FE20: COMBINING LIGATURE LEFT HALF
 ["ru"]=true,-- Russian
 },
 [65057]={-- U+FE21: COMBINING LIGATURE RIGHT HALF
 ["ru"]=true,-- Russian
 },
 }


 --[[--------------------------< E X P O R T S >---------------------------------------------------------------
 ]]

 return{
 ranges_t=ranges_t,
 singles_t=singles_t,
 specials_t=specials_t,

 sizeof_ranges_t=#ranges_t,
 }

AltStyle によって変換されたページ (->オリジナル) /