IDNA2.php 94 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911291229132914291529162917291829192920292129222923292429252926292729282929293029312932293329342935293629372938293929402941294229432944294529462947294829492950295129522953295429552956295729582959296029612962296329642965296629672968296929702971297229732974297529762977297829792980298129822983298429852986298729882989299029912992299329942995299629972998299930003001300230033004300530063007300830093010301130123013301430153016301730183019302030213022302330243025302630273028302930303031303230333034303530363037303830393040304130423043304430453046304730483049305030513052305330543055305630573058305930603061306230633064306530663067306830693070307130723073307430753076307730783079308030813082308330843085308630873088308930903091309230933094309530963097309830993100310131023103310431053106310731083109311031113112311331143115311631173118311931203121312231233124312531263127312831293130313131323133313431353136313731383139314031413142314331443145314631473148314931503151315231533154315531563157315831593160316131623163316431653166316731683169317031713172317331743175317631773178317931803181318231833184318531863187318831893190319131923193319431953196319731983199320032013202320332043205320632073208320932103211321232133214321532163217321832193220322132223223322432253226322732283229323032313232323332343235323632373238323932403241324232433244324532463247324832493250325132523253325432553256325732583259326032613262326332643265326632673268326932703271327232733274327532763277327832793280328132823283328432853286328732883289329032913292329332943295329632973298329933003301330233033304330533063307330833093310331133123313331433153316331733183319332033213322332333243325332633273328332933303331333233333334333533363337333833393340334133423343334433453346334733483349335033513352335333543355335633573358335933603361336233633364336533663367336833693370337133723373337433753376337733783379338033813382338333843385338633873388338933903391339233933394339533963397339833993400340134023403340434053406340734083409341034113412
  1. <?php
  2. // {{{ license{{{{{{{{{
  3. /* vim: set expandtab tabstop=4 shiftwidth=4 softtabstop=4 foldmethod=marker: */
  4. //
  5. // +----------------------------------------------------------------------+
  6. // | This library is free software; you can redistribute it and/or modify |
  7. // | it under the terms of the GNU Lesser General Public License as |
  8. // | published by the Free Software Foundation; either version 2.1 of the |
  9. // | License, or (at your option) any later version. |
  10. // | |
  11. // | This library is distributed in the hope that it will be useful, but |
  12. // | WITHOUT ANY WARRANTY; without even the implied warranty of |
  13. // | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
  14. // | Lesser General Public License for more details. |
  15. // | |
  16. // | You should have received a copy of the GNU Lesser General Public |
  17. // | License along with this library; if not, write to the Free Software |
  18. // | Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 |
  19. // | USA. |
  20. // +----------------------------------------------------------------------+
  21. //
  22. // }}}}}}}}}}}}
  23. require_once 'Net/IDNA2/Exception.php';
  24. require_once 'Net/IDNA2/Exception/Nameprep.php';
  25. /**
  26. * Encode/decode Internationalized Domain Names.
  27. *
  28. * The class allows one to convert internationalized domain names
  29. * (see RFC 3490 for details) as they can be used with various registries worldwide
  30. * to be translated between their original (localized) form and their encoded form
  31. * as it will be used in the DNS (Domain Name System).
  32. *
  33. * The class provides two public methods, encode() and decode(), which do exactly
  34. * what you would expect them to do. You are allowed to use complete domain names,
  35. * simple strings and complete email addresses as well. That means, that you might
  36. * use any of the following notations:
  37. *
  38. * - www.n�rgler.com
  39. * - xn--nrgler-wxa
  40. * - xn--brse-5qa.xn--knrz-1ra.info
  41. *
  42. * Unicode input might be given as either UTF-8 string, UCS-4 string or UCS-4
  43. * array. Unicode output is available in the same formats.
  44. * You can select your preferred format via {@link set_paramter()}.
  45. *
  46. * ACE input and output is always expected to be ASCII.
  47. *
  48. * @package Net
  49. * @author Markus Nix <mnix@docuverse.de>
  50. * @author Matthias Sommerfeld <mso@phlylabs.de>
  51. * @author Stefan Neufeind <pear.neufeind@speedpartner.de>
  52. * @version $Id$
  53. */
  54. class Net_IDNA2
  55. {
  56. // {{{ npdata
  57. /**
  58. * These Unicode codepoints are
  59. * mapped to nothing, See RFC3454 for details
  60. *
  61. * @static
  62. * @var array
  63. * @access private
  64. */
  65. private static $_np_map_nothing = [
  66. 0xAD,
  67. 0x34F,
  68. 0x1806,
  69. 0x180B,
  70. 0x180C,
  71. 0x180D,
  72. 0x200B,
  73. 0x200C,
  74. 0x200D,
  75. 0x2060,
  76. 0xFE00,
  77. 0xFE01,
  78. 0xFE02,
  79. 0xFE03,
  80. 0xFE04,
  81. 0xFE05,
  82. 0xFE06,
  83. 0xFE07,
  84. 0xFE08,
  85. 0xFE09,
  86. 0xFE0A,
  87. 0xFE0B,
  88. 0xFE0C,
  89. 0xFE0D,
  90. 0xFE0E,
  91. 0xFE0F,
  92. 0xFEFF
  93. ];
  94. /**
  95. * Prohibited codepints
  96. *
  97. * @static
  98. * @var array
  99. * @access private
  100. */
  101. private static $_general_prohibited = [
  102. 0,
  103. 1,
  104. 2,
  105. 3,
  106. 4,
  107. 5,
  108. 6,
  109. 7,
  110. 8,
  111. 9,
  112. 0xA,
  113. 0xB,
  114. 0xC,
  115. 0xD,
  116. 0xE,
  117. 0xF,
  118. 0x10,
  119. 0x11,
  120. 0x12,
  121. 0x13,
  122. 0x14,
  123. 0x15,
  124. 0x16,
  125. 0x17,
  126. 0x18,
  127. 0x19,
  128. 0x1A,
  129. 0x1B,
  130. 0x1C,
  131. 0x1D,
  132. 0x1E,
  133. 0x1F,
  134. 0x20,
  135. 0x21,
  136. 0x22,
  137. 0x23,
  138. 0x24,
  139. 0x25,
  140. 0x26,
  141. 0x27,
  142. 0x28,
  143. 0x29,
  144. 0x2A,
  145. 0x2B,
  146. 0x2C,
  147. 0x2F,
  148. 0x3B,
  149. 0x3C,
  150. 0x3D,
  151. 0x3E,
  152. 0x3F,
  153. 0x40,
  154. 0x5B,
  155. 0x5C,
  156. 0x5D,
  157. 0x5E,
  158. 0x5F,
  159. 0x60,
  160. 0x7B,
  161. 0x7C,
  162. 0x7D,
  163. 0x7E,
  164. 0x7F,
  165. 0x3002
  166. ];
  167. /**
  168. * Codepints prohibited by Nameprep
  169. * @static
  170. * @var array
  171. * @access private
  172. */
  173. private static $_np_prohibit = [
  174. 0xA0,
  175. 0x1680,
  176. 0x2000,
  177. 0x2001,
  178. 0x2002,
  179. 0x2003,
  180. 0x2004,
  181. 0x2005,
  182. 0x2006,
  183. 0x2007,
  184. 0x2008,
  185. 0x2009,
  186. 0x200A,
  187. 0x200B,
  188. 0x202F,
  189. 0x205F,
  190. 0x3000,
  191. 0x6DD,
  192. 0x70F,
  193. 0x180E,
  194. 0x200C,
  195. 0x200D,
  196. 0x2028,
  197. 0x2029,
  198. 0xFEFF,
  199. 0xFFF9,
  200. 0xFFFA,
  201. 0xFFFB,
  202. 0xFFFC,
  203. 0xFFFE,
  204. 0xFFFF,
  205. 0x1FFFE,
  206. 0x1FFFF,
  207. 0x2FFFE,
  208. 0x2FFFF,
  209. 0x3FFFE,
  210. 0x3FFFF,
  211. 0x4FFFE,
  212. 0x4FFFF,
  213. 0x5FFFE,
  214. 0x5FFFF,
  215. 0x6FFFE,
  216. 0x6FFFF,
  217. 0x7FFFE,
  218. 0x7FFFF,
  219. 0x8FFFE,
  220. 0x8FFFF,
  221. 0x9FFFE,
  222. 0x9FFFF,
  223. 0xAFFFE,
  224. 0xAFFFF,
  225. 0xBFFFE,
  226. 0xBFFFF,
  227. 0xCFFFE,
  228. 0xCFFFF,
  229. 0xDFFFE,
  230. 0xDFFFF,
  231. 0xEFFFE,
  232. 0xEFFFF,
  233. 0xFFFFE,
  234. 0xFFFFF,
  235. 0x10FFFE,
  236. 0x10FFFF,
  237. 0xFFF9,
  238. 0xFFFA,
  239. 0xFFFB,
  240. 0xFFFC,
  241. 0xFFFD,
  242. 0x340,
  243. 0x341,
  244. 0x200E,
  245. 0x200F,
  246. 0x202A,
  247. 0x202B,
  248. 0x202C,
  249. 0x202D,
  250. 0x202E,
  251. 0x206A,
  252. 0x206B,
  253. 0x206C,
  254. 0x206D,
  255. 0x206E,
  256. 0x206F,
  257. 0xE0001
  258. ];
  259. /**
  260. * Codepoint ranges prohibited by nameprep
  261. *
  262. * @static
  263. * @var array
  264. * @access private
  265. */
  266. private static $_np_prohibit_ranges = [
  267. [0x80, 0x9F],
  268. [0x2060, 0x206F],
  269. [0x1D173, 0x1D17A],
  270. [0xE000, 0xF8FF],
  271. [0xF0000, 0xFFFFD],
  272. [0x100000, 0x10FFFD],
  273. [0xFDD0, 0xFDEF],
  274. [0xD800, 0xDFFF],
  275. [0x2FF0, 0x2FFB],
  276. [0xE0020, 0xE007F]
  277. ];
  278. /**
  279. * Replacement mappings (casemapping, replacement sequences, ...)
  280. *
  281. * @static
  282. * @var array
  283. * @access private
  284. */
  285. private static $_np_replacemaps = [
  286. 0x41 => [0x61],
  287. 0x42 => [0x62],
  288. 0x43 => [0x63],
  289. 0x44 => [0x64],
  290. 0x45 => [0x65],
  291. 0x46 => [0x66],
  292. 0x47 => [0x67],
  293. 0x48 => [0x68],
  294. 0x49 => [0x69],
  295. 0x4A => [0x6A],
  296. 0x4B => [0x6B],
  297. 0x4C => [0x6C],
  298. 0x4D => [0x6D],
  299. 0x4E => [0x6E],
  300. 0x4F => [0x6F],
  301. 0x50 => [0x70],
  302. 0x51 => [0x71],
  303. 0x52 => [0x72],
  304. 0x53 => [0x73],
  305. 0x54 => [0x74],
  306. 0x55 => [0x75],
  307. 0x56 => [0x76],
  308. 0x57 => [0x77],
  309. 0x58 => [0x78],
  310. 0x59 => [0x79],
  311. 0x5A => [0x7A],
  312. 0xB5 => [0x3BC],
  313. 0xC0 => [0xE0],
  314. 0xC1 => [0xE1],
  315. 0xC2 => [0xE2],
  316. 0xC3 => [0xE3],
  317. 0xC4 => [0xE4],
  318. 0xC5 => [0xE5],
  319. 0xC6 => [0xE6],
  320. 0xC7 => [0xE7],
  321. 0xC8 => [0xE8],
  322. 0xC9 => [0xE9],
  323. 0xCA => [0xEA],
  324. 0xCB => [0xEB],
  325. 0xCC => [0xEC],
  326. 0xCD => [0xED],
  327. 0xCE => [0xEE],
  328. 0xCF => [0xEF],
  329. 0xD0 => [0xF0],
  330. 0xD1 => [0xF1],
  331. 0xD2 => [0xF2],
  332. 0xD3 => [0xF3],
  333. 0xD4 => [0xF4],
  334. 0xD5 => [0xF5],
  335. 0xD6 => [0xF6],
  336. 0xD8 => [0xF8],
  337. 0xD9 => [0xF9],
  338. 0xDA => [0xFA],
  339. 0xDB => [0xFB],
  340. 0xDC => [0xFC],
  341. 0xDD => [0xFD],
  342. 0xDE => [0xFE],
  343. 0xDF => [0x73, 0x73],
  344. 0x100 => [0x101],
  345. 0x102 => [0x103],
  346. 0x104 => [0x105],
  347. 0x106 => [0x107],
  348. 0x108 => [0x109],
  349. 0x10A => [0x10B],
  350. 0x10C => [0x10D],
  351. 0x10E => [0x10F],
  352. 0x110 => [0x111],
  353. 0x112 => [0x113],
  354. 0x114 => [0x115],
  355. 0x116 => [0x117],
  356. 0x118 => [0x119],
  357. 0x11A => [0x11B],
  358. 0x11C => [0x11D],
  359. 0x11E => [0x11F],
  360. 0x120 => [0x121],
  361. 0x122 => [0x123],
  362. 0x124 => [0x125],
  363. 0x126 => [0x127],
  364. 0x128 => [0x129],
  365. 0x12A => [0x12B],
  366. 0x12C => [0x12D],
  367. 0x12E => [0x12F],
  368. 0x130 => [0x69, 0x307],
  369. 0x132 => [0x133],
  370. 0x134 => [0x135],
  371. 0x136 => [0x137],
  372. 0x139 => [0x13A],
  373. 0x13B => [0x13C],
  374. 0x13D => [0x13E],
  375. 0x13F => [0x140],
  376. 0x141 => [0x142],
  377. 0x143 => [0x144],
  378. 0x145 => [0x146],
  379. 0x147 => [0x148],
  380. 0x149 => [0x2BC, 0x6E],
  381. 0x14A => [0x14B],
  382. 0x14C => [0x14D],
  383. 0x14E => [0x14F],
  384. 0x150 => [0x151],
  385. 0x152 => [0x153],
  386. 0x154 => [0x155],
  387. 0x156 => [0x157],
  388. 0x158 => [0x159],
  389. 0x15A => [0x15B],
  390. 0x15C => [0x15D],
  391. 0x15E => [0x15F],
  392. 0x160 => [0x161],
  393. 0x162 => [0x163],
  394. 0x164 => [0x165],
  395. 0x166 => [0x167],
  396. 0x168 => [0x169],
  397. 0x16A => [0x16B],
  398. 0x16C => [0x16D],
  399. 0x16E => [0x16F],
  400. 0x170 => [0x171],
  401. 0x172 => [0x173],
  402. 0x174 => [0x175],
  403. 0x176 => [0x177],
  404. 0x178 => [0xFF],
  405. 0x179 => [0x17A],
  406. 0x17B => [0x17C],
  407. 0x17D => [0x17E],
  408. 0x17F => [0x73],
  409. 0x181 => [0x253],
  410. 0x182 => [0x183],
  411. 0x184 => [0x185],
  412. 0x186 => [0x254],
  413. 0x187 => [0x188],
  414. 0x189 => [0x256],
  415. 0x18A => [0x257],
  416. 0x18B => [0x18C],
  417. 0x18E => [0x1DD],
  418. 0x18F => [0x259],
  419. 0x190 => [0x25B],
  420. 0x191 => [0x192],
  421. 0x193 => [0x260],
  422. 0x194 => [0x263],
  423. 0x196 => [0x269],
  424. 0x197 => [0x268],
  425. 0x198 => [0x199],
  426. 0x19C => [0x26F],
  427. 0x19D => [0x272],
  428. 0x19F => [0x275],
  429. 0x1A0 => [0x1A1],
  430. 0x1A2 => [0x1A3],
  431. 0x1A4 => [0x1A5],
  432. 0x1A6 => [0x280],
  433. 0x1A7 => [0x1A8],
  434. 0x1A9 => [0x283],
  435. 0x1AC => [0x1AD],
  436. 0x1AE => [0x288],
  437. 0x1AF => [0x1B0],
  438. 0x1B1 => [0x28A],
  439. 0x1B2 => [0x28B],
  440. 0x1B3 => [0x1B4],
  441. 0x1B5 => [0x1B6],
  442. 0x1B7 => [0x292],
  443. 0x1B8 => [0x1B9],
  444. 0x1BC => [0x1BD],
  445. 0x1C4 => [0x1C6],
  446. 0x1C5 => [0x1C6],
  447. 0x1C7 => [0x1C9],
  448. 0x1C8 => [0x1C9],
  449. 0x1CA => [0x1CC],
  450. 0x1CB => [0x1CC],
  451. 0x1CD => [0x1CE],
  452. 0x1CF => [0x1D0],
  453. 0x1D1 => [0x1D2],
  454. 0x1D3 => [0x1D4],
  455. 0x1D5 => [0x1D6],
  456. 0x1D7 => [0x1D8],
  457. 0x1D9 => [0x1DA],
  458. 0x1DB => [0x1DC],
  459. 0x1DE => [0x1DF],
  460. 0x1E0 => [0x1E1],
  461. 0x1E2 => [0x1E3],
  462. 0x1E4 => [0x1E5],
  463. 0x1E6 => [0x1E7],
  464. 0x1E8 => [0x1E9],
  465. 0x1EA => [0x1EB],
  466. 0x1EC => [0x1ED],
  467. 0x1EE => [0x1EF],
  468. 0x1F0 => [0x6A, 0x30C],
  469. 0x1F1 => [0x1F3],
  470. 0x1F2 => [0x1F3],
  471. 0x1F4 => [0x1F5],
  472. 0x1F6 => [0x195],
  473. 0x1F7 => [0x1BF],
  474. 0x1F8 => [0x1F9],
  475. 0x1FA => [0x1FB],
  476. 0x1FC => [0x1FD],
  477. 0x1FE => [0x1FF],
  478. 0x200 => [0x201],
  479. 0x202 => [0x203],
  480. 0x204 => [0x205],
  481. 0x206 => [0x207],
  482. 0x208 => [0x209],
  483. 0x20A => [0x20B],
  484. 0x20C => [0x20D],
  485. 0x20E => [0x20F],
  486. 0x210 => [0x211],
  487. 0x212 => [0x213],
  488. 0x214 => [0x215],
  489. 0x216 => [0x217],
  490. 0x218 => [0x219],
  491. 0x21A => [0x21B],
  492. 0x21C => [0x21D],
  493. 0x21E => [0x21F],
  494. 0x220 => [0x19E],
  495. 0x222 => [0x223],
  496. 0x224 => [0x225],
  497. 0x226 => [0x227],
  498. 0x228 => [0x229],
  499. 0x22A => [0x22B],
  500. 0x22C => [0x22D],
  501. 0x22E => [0x22F],
  502. 0x230 => [0x231],
  503. 0x232 => [0x233],
  504. 0x345 => [0x3B9],
  505. 0x37A => [0x20, 0x3B9],
  506. 0x386 => [0x3AC],
  507. 0x388 => [0x3AD],
  508. 0x389 => [0x3AE],
  509. 0x38A => [0x3AF],
  510. 0x38C => [0x3CC],
  511. 0x38E => [0x3CD],
  512. 0x38F => [0x3CE],
  513. 0x390 => [0x3B9, 0x308, 0x301],
  514. 0x391 => [0x3B1],
  515. 0x392 => [0x3B2],
  516. 0x393 => [0x3B3],
  517. 0x394 => [0x3B4],
  518. 0x395 => [0x3B5],
  519. 0x396 => [0x3B6],
  520. 0x397 => [0x3B7],
  521. 0x398 => [0x3B8],
  522. 0x399 => [0x3B9],
  523. 0x39A => [0x3BA],
  524. 0x39B => [0x3BB],
  525. 0x39C => [0x3BC],
  526. 0x39D => [0x3BD],
  527. 0x39E => [0x3BE],
  528. 0x39F => [0x3BF],
  529. 0x3A0 => [0x3C0],
  530. 0x3A1 => [0x3C1],
  531. 0x3A3 => [0x3C3],
  532. 0x3A4 => [0x3C4],
  533. 0x3A5 => [0x3C5],
  534. 0x3A6 => [0x3C6],
  535. 0x3A7 => [0x3C7],
  536. 0x3A8 => [0x3C8],
  537. 0x3A9 => [0x3C9],
  538. 0x3AA => [0x3CA],
  539. 0x3AB => [0x3CB],
  540. 0x3B0 => [0x3C5, 0x308, 0x301],
  541. 0x3C2 => [0x3C3],
  542. 0x3D0 => [0x3B2],
  543. 0x3D1 => [0x3B8],
  544. 0x3D2 => [0x3C5],
  545. 0x3D3 => [0x3CD],
  546. 0x3D4 => [0x3CB],
  547. 0x3D5 => [0x3C6],
  548. 0x3D6 => [0x3C0],
  549. 0x3D8 => [0x3D9],
  550. 0x3DA => [0x3DB],
  551. 0x3DC => [0x3DD],
  552. 0x3DE => [0x3DF],
  553. 0x3E0 => [0x3E1],
  554. 0x3E2 => [0x3E3],
  555. 0x3E4 => [0x3E5],
  556. 0x3E6 => [0x3E7],
  557. 0x3E8 => [0x3E9],
  558. 0x3EA => [0x3EB],
  559. 0x3EC => [0x3ED],
  560. 0x3EE => [0x3EF],
  561. 0x3F0 => [0x3BA],
  562. 0x3F1 => [0x3C1],
  563. 0x3F2 => [0x3C3],
  564. 0x3F4 => [0x3B8],
  565. 0x3F5 => [0x3B5],
  566. 0x400 => [0x450],
  567. 0x401 => [0x451],
  568. 0x402 => [0x452],
  569. 0x403 => [0x453],
  570. 0x404 => [0x454],
  571. 0x405 => [0x455],
  572. 0x406 => [0x456],
  573. 0x407 => [0x457],
  574. 0x408 => [0x458],
  575. 0x409 => [0x459],
  576. 0x40A => [0x45A],
  577. 0x40B => [0x45B],
  578. 0x40C => [0x45C],
  579. 0x40D => [0x45D],
  580. 0x40E => [0x45E],
  581. 0x40F => [0x45F],
  582. 0x410 => [0x430],
  583. 0x411 => [0x431],
  584. 0x412 => [0x432],
  585. 0x413 => [0x433],
  586. 0x414 => [0x434],
  587. 0x415 => [0x435],
  588. 0x416 => [0x436],
  589. 0x417 => [0x437],
  590. 0x418 => [0x438],
  591. 0x419 => [0x439],
  592. 0x41A => [0x43A],
  593. 0x41B => [0x43B],
  594. 0x41C => [0x43C],
  595. 0x41D => [0x43D],
  596. 0x41E => [0x43E],
  597. 0x41F => [0x43F],
  598. 0x420 => [0x440],
  599. 0x421 => [0x441],
  600. 0x422 => [0x442],
  601. 0x423 => [0x443],
  602. 0x424 => [0x444],
  603. 0x425 => [0x445],
  604. 0x426 => [0x446],
  605. 0x427 => [0x447],
  606. 0x428 => [0x448],
  607. 0x429 => [0x449],
  608. 0x42A => [0x44A],
  609. 0x42B => [0x44B],
  610. 0x42C => [0x44C],
  611. 0x42D => [0x44D],
  612. 0x42E => [0x44E],
  613. 0x42F => [0x44F],
  614. 0x460 => [0x461],
  615. 0x462 => [0x463],
  616. 0x464 => [0x465],
  617. 0x466 => [0x467],
  618. 0x468 => [0x469],
  619. 0x46A => [0x46B],
  620. 0x46C => [0x46D],
  621. 0x46E => [0x46F],
  622. 0x470 => [0x471],
  623. 0x472 => [0x473],
  624. 0x474 => [0x475],
  625. 0x476 => [0x477],
  626. 0x478 => [0x479],
  627. 0x47A => [0x47B],
  628. 0x47C => [0x47D],
  629. 0x47E => [0x47F],
  630. 0x480 => [0x481],
  631. 0x48A => [0x48B],
  632. 0x48C => [0x48D],
  633. 0x48E => [0x48F],
  634. 0x490 => [0x491],
  635. 0x492 => [0x493],
  636. 0x494 => [0x495],
  637. 0x496 => [0x497],
  638. 0x498 => [0x499],
  639. 0x49A => [0x49B],
  640. 0x49C => [0x49D],
  641. 0x49E => [0x49F],
  642. 0x4A0 => [0x4A1],
  643. 0x4A2 => [0x4A3],
  644. 0x4A4 => [0x4A5],
  645. 0x4A6 => [0x4A7],
  646. 0x4A8 => [0x4A9],
  647. 0x4AA => [0x4AB],
  648. 0x4AC => [0x4AD],
  649. 0x4AE => [0x4AF],
  650. 0x4B0 => [0x4B1],
  651. 0x4B2 => [0x4B3],
  652. 0x4B4 => [0x4B5],
  653. 0x4B6 => [0x4B7],
  654. 0x4B8 => [0x4B9],
  655. 0x4BA => [0x4BB],
  656. 0x4BC => [0x4BD],
  657. 0x4BE => [0x4BF],
  658. 0x4C1 => [0x4C2],
  659. 0x4C3 => [0x4C4],
  660. 0x4C5 => [0x4C6],
  661. 0x4C7 => [0x4C8],
  662. 0x4C9 => [0x4CA],
  663. 0x4CB => [0x4CC],
  664. 0x4CD => [0x4CE],
  665. 0x4D0 => [0x4D1],
  666. 0x4D2 => [0x4D3],
  667. 0x4D4 => [0x4D5],
  668. 0x4D6 => [0x4D7],
  669. 0x4D8 => [0x4D9],
  670. 0x4DA => [0x4DB],
  671. 0x4DC => [0x4DD],
  672. 0x4DE => [0x4DF],
  673. 0x4E0 => [0x4E1],
  674. 0x4E2 => [0x4E3],
  675. 0x4E4 => [0x4E5],
  676. 0x4E6 => [0x4E7],
  677. 0x4E8 => [0x4E9],
  678. 0x4EA => [0x4EB],
  679. 0x4EC => [0x4ED],
  680. 0x4EE => [0x4EF],
  681. 0x4F0 => [0x4F1],
  682. 0x4F2 => [0x4F3],
  683. 0x4F4 => [0x4F5],
  684. 0x4F8 => [0x4F9],
  685. 0x500 => [0x501],
  686. 0x502 => [0x503],
  687. 0x504 => [0x505],
  688. 0x506 => [0x507],
  689. 0x508 => [0x509],
  690. 0x50A => [0x50B],
  691. 0x50C => [0x50D],
  692. 0x50E => [0x50F],
  693. 0x531 => [0x561],
  694. 0x532 => [0x562],
  695. 0x533 => [0x563],
  696. 0x534 => [0x564],
  697. 0x535 => [0x565],
  698. 0x536 => [0x566],
  699. 0x537 => [0x567],
  700. 0x538 => [0x568],
  701. 0x539 => [0x569],
  702. 0x53A => [0x56A],
  703. 0x53B => [0x56B],
  704. 0x53C => [0x56C],
  705. 0x53D => [0x56D],
  706. 0x53E => [0x56E],
  707. 0x53F => [0x56F],
  708. 0x540 => [0x570],
  709. 0x541 => [0x571],
  710. 0x542 => [0x572],
  711. 0x543 => [0x573],
  712. 0x544 => [0x574],
  713. 0x545 => [0x575],
  714. 0x546 => [0x576],
  715. 0x547 => [0x577],
  716. 0x548 => [0x578],
  717. 0x549 => [0x579],
  718. 0x54A => [0x57A],
  719. 0x54B => [0x57B],
  720. 0x54C => [0x57C],
  721. 0x54D => [0x57D],
  722. 0x54E => [0x57E],
  723. 0x54F => [0x57F],
  724. 0x550 => [0x580],
  725. 0x551 => [0x581],
  726. 0x552 => [0x582],
  727. 0x553 => [0x583],
  728. 0x554 => [0x584],
  729. 0x555 => [0x585],
  730. 0x556 => [0x586],
  731. 0x587 => [0x565, 0x582],
  732. 0x1E00 => [0x1E01],
  733. 0x1E02 => [0x1E03],
  734. 0x1E04 => [0x1E05],
  735. 0x1E06 => [0x1E07],
  736. 0x1E08 => [0x1E09],
  737. 0x1E0A => [0x1E0B],
  738. 0x1E0C => [0x1E0D],
  739. 0x1E0E => [0x1E0F],
  740. 0x1E10 => [0x1E11],
  741. 0x1E12 => [0x1E13],
  742. 0x1E14 => [0x1E15],
  743. 0x1E16 => [0x1E17],
  744. 0x1E18 => [0x1E19],
  745. 0x1E1A => [0x1E1B],
  746. 0x1E1C => [0x1E1D],
  747. 0x1E1E => [0x1E1F],
  748. 0x1E20 => [0x1E21],
  749. 0x1E22 => [0x1E23],
  750. 0x1E24 => [0x1E25],
  751. 0x1E26 => [0x1E27],
  752. 0x1E28 => [0x1E29],
  753. 0x1E2A => [0x1E2B],
  754. 0x1E2C => [0x1E2D],
  755. 0x1E2E => [0x1E2F],
  756. 0x1E30 => [0x1E31],
  757. 0x1E32 => [0x1E33],
  758. 0x1E34 => [0x1E35],
  759. 0x1E36 => [0x1E37],
  760. 0x1E38 => [0x1E39],
  761. 0x1E3A => [0x1E3B],
  762. 0x1E3C => [0x1E3D],
  763. 0x1E3E => [0x1E3F],
  764. 0x1E40 => [0x1E41],
  765. 0x1E42 => [0x1E43],
  766. 0x1E44 => [0x1E45],
  767. 0x1E46 => [0x1E47],
  768. 0x1E48 => [0x1E49],
  769. 0x1E4A => [0x1E4B],
  770. 0x1E4C => [0x1E4D],
  771. 0x1E4E => [0x1E4F],
  772. 0x1E50 => [0x1E51],
  773. 0x1E52 => [0x1E53],
  774. 0x1E54 => [0x1E55],
  775. 0x1E56 => [0x1E57],
  776. 0x1E58 => [0x1E59],
  777. 0x1E5A => [0x1E5B],
  778. 0x1E5C => [0x1E5D],
  779. 0x1E5E => [0x1E5F],
  780. 0x1E60 => [0x1E61],
  781. 0x1E62 => [0x1E63],
  782. 0x1E64 => [0x1E65],
  783. 0x1E66 => [0x1E67],
  784. 0x1E68 => [0x1E69],
  785. 0x1E6A => [0x1E6B],
  786. 0x1E6C => [0x1E6D],
  787. 0x1E6E => [0x1E6F],
  788. 0x1E70 => [0x1E71],
  789. 0x1E72 => [0x1E73],
  790. 0x1E74 => [0x1E75],
  791. 0x1E76 => [0x1E77],
  792. 0x1E78 => [0x1E79],
  793. 0x1E7A => [0x1E7B],
  794. 0x1E7C => [0x1E7D],
  795. 0x1E7E => [0x1E7F],
  796. 0x1E80 => [0x1E81],
  797. 0x1E82 => [0x1E83],
  798. 0x1E84 => [0x1E85],
  799. 0x1E86 => [0x1E87],
  800. 0x1E88 => [0x1E89],
  801. 0x1E8A => [0x1E8B],
  802. 0x1E8C => [0x1E8D],
  803. 0x1E8E => [0x1E8F],
  804. 0x1E90 => [0x1E91],
  805. 0x1E92 => [0x1E93],
  806. 0x1E94 => [0x1E95],
  807. 0x1E96 => [0x68, 0x331],
  808. 0x1E97 => [0x74, 0x308],
  809. 0x1E98 => [0x77, 0x30A],
  810. 0x1E99 => [0x79, 0x30A],
  811. 0x1E9A => [0x61, 0x2BE],
  812. 0x1E9B => [0x1E61],
  813. 0x1EA0 => [0x1EA1],
  814. 0x1EA2 => [0x1EA3],
  815. 0x1EA4 => [0x1EA5],
  816. 0x1EA6 => [0x1EA7],
  817. 0x1EA8 => [0x1EA9],
  818. 0x1EAA => [0x1EAB],
  819. 0x1EAC => [0x1EAD],
  820. 0x1EAE => [0x1EAF],
  821. 0x1EB0 => [0x1EB1],
  822. 0x1EB2 => [0x1EB3],
  823. 0x1EB4 => [0x1EB5],
  824. 0x1EB6 => [0x1EB7],
  825. 0x1EB8 => [0x1EB9],
  826. 0x1EBA => [0x1EBB],
  827. 0x1EBC => [0x1EBD],
  828. 0x1EBE => [0x1EBF],
  829. 0x1EC0 => [0x1EC1],
  830. 0x1EC2 => [0x1EC3],
  831. 0x1EC4 => [0x1EC5],
  832. 0x1EC6 => [0x1EC7],
  833. 0x1EC8 => [0x1EC9],
  834. 0x1ECA => [0x1ECB],
  835. 0x1ECC => [0x1ECD],
  836. 0x1ECE => [0x1ECF],
  837. 0x1ED0 => [0x1ED1],
  838. 0x1ED2 => [0x1ED3],
  839. 0x1ED4 => [0x1ED5],
  840. 0x1ED6 => [0x1ED7],
  841. 0x1ED8 => [0x1ED9],
  842. 0x1EDA => [0x1EDB],
  843. 0x1EDC => [0x1EDD],
  844. 0x1EDE => [0x1EDF],
  845. 0x1EE0 => [0x1EE1],
  846. 0x1EE2 => [0x1EE3],
  847. 0x1EE4 => [0x1EE5],
  848. 0x1EE6 => [0x1EE7],
  849. 0x1EE8 => [0x1EE9],
  850. 0x1EEA => [0x1EEB],
  851. 0x1EEC => [0x1EED],
  852. 0x1EEE => [0x1EEF],
  853. 0x1EF0 => [0x1EF1],
  854. 0x1EF2 => [0x1EF3],
  855. 0x1EF4 => [0x1EF5],
  856. 0x1EF6 => [0x1EF7],
  857. 0x1EF8 => [0x1EF9],
  858. 0x1F08 => [0x1F00],
  859. 0x1F09 => [0x1F01],
  860. 0x1F0A => [0x1F02],
  861. 0x1F0B => [0x1F03],
  862. 0x1F0C => [0x1F04],
  863. 0x1F0D => [0x1F05],
  864. 0x1F0E => [0x1F06],
  865. 0x1F0F => [0x1F07],
  866. 0x1F18 => [0x1F10],
  867. 0x1F19 => [0x1F11],
  868. 0x1F1A => [0x1F12],
  869. 0x1F1B => [0x1F13],
  870. 0x1F1C => [0x1F14],
  871. 0x1F1D => [0x1F15],
  872. 0x1F28 => [0x1F20],
  873. 0x1F29 => [0x1F21],
  874. 0x1F2A => [0x1F22],
  875. 0x1F2B => [0x1F23],
  876. 0x1F2C => [0x1F24],
  877. 0x1F2D => [0x1F25],
  878. 0x1F2E => [0x1F26],
  879. 0x1F2F => [0x1F27],
  880. 0x1F38 => [0x1F30],
  881. 0x1F39 => [0x1F31],
  882. 0x1F3A => [0x1F32],
  883. 0x1F3B => [0x1F33],
  884. 0x1F3C => [0x1F34],
  885. 0x1F3D => [0x1F35],
  886. 0x1F3E => [0x1F36],
  887. 0x1F3F => [0x1F37],
  888. 0x1F48 => [0x1F40],
  889. 0x1F49 => [0x1F41],
  890. 0x1F4A => [0x1F42],
  891. 0x1F4B => [0x1F43],
  892. 0x1F4C => [0x1F44],
  893. 0x1F4D => [0x1F45],
  894. 0x1F50 => [0x3C5, 0x313],
  895. 0x1F52 => [0x3C5, 0x313, 0x300],
  896. 0x1F54 => [0x3C5, 0x313, 0x301],
  897. 0x1F56 => [0x3C5, 0x313, 0x342],
  898. 0x1F59 => [0x1F51],
  899. 0x1F5B => [0x1F53],
  900. 0x1F5D => [0x1F55],
  901. 0x1F5F => [0x1F57],
  902. 0x1F68 => [0x1F60],
  903. 0x1F69 => [0x1F61],
  904. 0x1F6A => [0x1F62],
  905. 0x1F6B => [0x1F63],
  906. 0x1F6C => [0x1F64],
  907. 0x1F6D => [0x1F65],
  908. 0x1F6E => [0x1F66],
  909. 0x1F6F => [0x1F67],
  910. 0x1F80 => [0x1F00, 0x3B9],
  911. 0x1F81 => [0x1F01, 0x3B9],
  912. 0x1F82 => [0x1F02, 0x3B9],
  913. 0x1F83 => [0x1F03, 0x3B9],
  914. 0x1F84 => [0x1F04, 0x3B9],
  915. 0x1F85 => [0x1F05, 0x3B9],
  916. 0x1F86 => [0x1F06, 0x3B9],
  917. 0x1F87 => [0x1F07, 0x3B9],
  918. 0x1F88 => [0x1F00, 0x3B9],
  919. 0x1F89 => [0x1F01, 0x3B9],
  920. 0x1F8A => [0x1F02, 0x3B9],
  921. 0x1F8B => [0x1F03, 0x3B9],
  922. 0x1F8C => [0x1F04, 0x3B9],
  923. 0x1F8D => [0x1F05, 0x3B9],
  924. 0x1F8E => [0x1F06, 0x3B9],
  925. 0x1F8F => [0x1F07, 0x3B9],
  926. 0x1F90 => [0x1F20, 0x3B9],
  927. 0x1F91 => [0x1F21, 0x3B9],
  928. 0x1F92 => [0x1F22, 0x3B9],
  929. 0x1F93 => [0x1F23, 0x3B9],
  930. 0x1F94 => [0x1F24, 0x3B9],
  931. 0x1F95 => [0x1F25, 0x3B9],
  932. 0x1F96 => [0x1F26, 0x3B9],
  933. 0x1F97 => [0x1F27, 0x3B9],
  934. 0x1F98 => [0x1F20, 0x3B9],
  935. 0x1F99 => [0x1F21, 0x3B9],
  936. 0x1F9A => [0x1F22, 0x3B9],
  937. 0x1F9B => [0x1F23, 0x3B9],
  938. 0x1F9C => [0x1F24, 0x3B9],
  939. 0x1F9D => [0x1F25, 0x3B9],
  940. 0x1F9E => [0x1F26, 0x3B9],
  941. 0x1F9F => [0x1F27, 0x3B9],
  942. 0x1FA0 => [0x1F60, 0x3B9],
  943. 0x1FA1 => [0x1F61, 0x3B9],
  944. 0x1FA2 => [0x1F62, 0x3B9],
  945. 0x1FA3 => [0x1F63, 0x3B9],
  946. 0x1FA4 => [0x1F64, 0x3B9],
  947. 0x1FA5 => [0x1F65, 0x3B9],
  948. 0x1FA6 => [0x1F66, 0x3B9],
  949. 0x1FA7 => [0x1F67, 0x3B9],
  950. 0x1FA8 => [0x1F60, 0x3B9],
  951. 0x1FA9 => [0x1F61, 0x3B9],
  952. 0x1FAA => [0x1F62, 0x3B9],
  953. 0x1FAB => [0x1F63, 0x3B9],
  954. 0x1FAC => [0x1F64, 0x3B9],
  955. 0x1FAD => [0x1F65, 0x3B9],
  956. 0x1FAE => [0x1F66, 0x3B9],
  957. 0x1FAF => [0x1F67, 0x3B9],
  958. 0x1FB2 => [0x1F70, 0x3B9],
  959. 0x1FB3 => [0x3B1, 0x3B9],
  960. 0x1FB4 => [0x3AC, 0x3B9],
  961. 0x1FB6 => [0x3B1, 0x342],
  962. 0x1FB7 => [0x3B1, 0x342, 0x3B9],
  963. 0x1FB8 => [0x1FB0],
  964. 0x1FB9 => [0x1FB1],
  965. 0x1FBA => [0x1F70],
  966. 0x1FBB => [0x1F71],
  967. 0x1FBC => [0x3B1, 0x3B9],
  968. 0x1FBE => [0x3B9],
  969. 0x1FC2 => [0x1F74, 0x3B9],
  970. 0x1FC3 => [0x3B7, 0x3B9],
  971. 0x1FC4 => [0x3AE, 0x3B9],
  972. 0x1FC6 => [0x3B7, 0x342],
  973. 0x1FC7 => [0x3B7, 0x342, 0x3B9],
  974. 0x1FC8 => [0x1F72],
  975. 0x1FC9 => [0x1F73],
  976. 0x1FCA => [0x1F74],
  977. 0x1FCB => [0x1F75],
  978. 0x1FCC => [0x3B7, 0x3B9],
  979. 0x1FD2 => [0x3B9, 0x308, 0x300],
  980. 0x1FD3 => [0x3B9, 0x308, 0x301],
  981. 0x1FD6 => [0x3B9, 0x342],
  982. 0x1FD7 => [0x3B9, 0x308, 0x342],
  983. 0x1FD8 => [0x1FD0],
  984. 0x1FD9 => [0x1FD1],
  985. 0x1FDA => [0x1F76],
  986. 0x1FDB => [0x1F77],
  987. 0x1FE2 => [0x3C5, 0x308, 0x300],
  988. 0x1FE3 => [0x3C5, 0x308, 0x301],
  989. 0x1FE4 => [0x3C1, 0x313],
  990. 0x1FE6 => [0x3C5, 0x342],
  991. 0x1FE7 => [0x3C5, 0x308, 0x342],
  992. 0x1FE8 => [0x1FE0],
  993. 0x1FE9 => [0x1FE1],
  994. 0x1FEA => [0x1F7A],
  995. 0x1FEB => [0x1F7B],
  996. 0x1FEC => [0x1FE5],
  997. 0x1FF2 => [0x1F7C, 0x3B9],
  998. 0x1FF3 => [0x3C9, 0x3B9],
  999. 0x1FF4 => [0x3CE, 0x3B9],
  1000. 0x1FF6 => [0x3C9, 0x342],
  1001. 0x1FF7 => [0x3C9, 0x342, 0x3B9],
  1002. 0x1FF8 => [0x1F78],
  1003. 0x1FF9 => [0x1F79],
  1004. 0x1FFA => [0x1F7C],
  1005. 0x1FFB => [0x1F7D],
  1006. 0x1FFC => [0x3C9, 0x3B9],
  1007. 0x20A8 => [0x72, 0x73],
  1008. 0x2102 => [0x63],
  1009. 0x2103 => [0xB0, 0x63],
  1010. 0x2107 => [0x25B],
  1011. 0x2109 => [0xB0, 0x66],
  1012. 0x210B => [0x68],
  1013. 0x210C => [0x68],
  1014. 0x210D => [0x68],
  1015. 0x2110 => [0x69],
  1016. 0x2111 => [0x69],
  1017. 0x2112 => [0x6C],
  1018. 0x2115 => [0x6E],
  1019. 0x2116 => [0x6E, 0x6F],
  1020. 0x2119 => [0x70],
  1021. 0x211A => [0x71],
  1022. 0x211B => [0x72],
  1023. 0x211C => [0x72],
  1024. 0x211D => [0x72],
  1025. 0x2120 => [0x73, 0x6D],
  1026. 0x2121 => [0x74, 0x65, 0x6C],
  1027. 0x2122 => [0x74, 0x6D],
  1028. 0x2124 => [0x7A],
  1029. 0x2126 => [0x3C9],
  1030. 0x2128 => [0x7A],
  1031. 0x212A => [0x6B],
  1032. 0x212B => [0xE5],
  1033. 0x212C => [0x62],
  1034. 0x212D => [0x63],
  1035. 0x2130 => [0x65],
  1036. 0x2131 => [0x66],
  1037. 0x2133 => [0x6D],
  1038. 0x213E => [0x3B3],
  1039. 0x213F => [0x3C0],
  1040. 0x2145 => [0x64],
  1041. 0x2160 => [0x2170],
  1042. 0x2161 => [0x2171],
  1043. 0x2162 => [0x2172],
  1044. 0x2163 => [0x2173],
  1045. 0x2164 => [0x2174],
  1046. 0x2165 => [0x2175],
  1047. 0x2166 => [0x2176],
  1048. 0x2167 => [0x2177],
  1049. 0x2168 => [0x2178],
  1050. 0x2169 => [0x2179],
  1051. 0x216A => [0x217A],
  1052. 0x216B => [0x217B],
  1053. 0x216C => [0x217C],
  1054. 0x216D => [0x217D],
  1055. 0x216E => [0x217E],
  1056. 0x216F => [0x217F],
  1057. 0x24B6 => [0x24D0],
  1058. 0x24B7 => [0x24D1],
  1059. 0x24B8 => [0x24D2],
  1060. 0x24B9 => [0x24D3],
  1061. 0x24BA => [0x24D4],
  1062. 0x24BB => [0x24D5],
  1063. 0x24BC => [0x24D6],
  1064. 0x24BD => [0x24D7],
  1065. 0x24BE => [0x24D8],
  1066. 0x24BF => [0x24D9],
  1067. 0x24C0 => [0x24DA],
  1068. 0x24C1 => [0x24DB],
  1069. 0x24C2 => [0x24DC],
  1070. 0x24C3 => [0x24DD],
  1071. 0x24C4 => [0x24DE],
  1072. 0x24C5 => [0x24DF],
  1073. 0x24C6 => [0x24E0],
  1074. 0x24C7 => [0x24E1],
  1075. 0x24C8 => [0x24E2],
  1076. 0x24C9 => [0x24E3],
  1077. 0x24CA => [0x24E4],
  1078. 0x24CB => [0x24E5],
  1079. 0x24CC => [0x24E6],
  1080. 0x24CD => [0x24E7],
  1081. 0x24CE => [0x24E8],
  1082. 0x24CF => [0x24E9],
  1083. 0x3371 => [0x68, 0x70, 0x61],
  1084. 0x3373 => [0x61, 0x75],
  1085. 0x3375 => [0x6F, 0x76],
  1086. 0x3380 => [0x70, 0x61],
  1087. 0x3381 => [0x6E, 0x61],
  1088. 0x3382 => [0x3BC, 0x61],
  1089. 0x3383 => [0x6D, 0x61],
  1090. 0x3384 => [0x6B, 0x61],
  1091. 0x3385 => [0x6B, 0x62],
  1092. 0x3386 => [0x6D, 0x62],
  1093. 0x3387 => [0x67, 0x62],
  1094. 0x338A => [0x70, 0x66],
  1095. 0x338B => [0x6E, 0x66],
  1096. 0x338C => [0x3BC, 0x66],
  1097. 0x3390 => [0x68, 0x7A],
  1098. 0x3391 => [0x6B, 0x68, 0x7A],
  1099. 0x3392 => [0x6D, 0x68, 0x7A],
  1100. 0x3393 => [0x67, 0x68, 0x7A],
  1101. 0x3394 => [0x74, 0x68, 0x7A],
  1102. 0x33A9 => [0x70, 0x61],
  1103. 0x33AA => [0x6B, 0x70, 0x61],
  1104. 0x33AB => [0x6D, 0x70, 0x61],
  1105. 0x33AC => [0x67, 0x70, 0x61],
  1106. 0x33B4 => [0x70, 0x76],
  1107. 0x33B5 => [0x6E, 0x76],
  1108. 0x33B6 => [0x3BC, 0x76],
  1109. 0x33B7 => [0x6D, 0x76],
  1110. 0x33B8 => [0x6B, 0x76],
  1111. 0x33B9 => [0x6D, 0x76],
  1112. 0x33BA => [0x70, 0x77],
  1113. 0x33BB => [0x6E, 0x77],
  1114. 0x33BC => [0x3BC, 0x77],
  1115. 0x33BD => [0x6D, 0x77],
  1116. 0x33BE => [0x6B, 0x77],
  1117. 0x33BF => [0x6D, 0x77],
  1118. 0x33C0 => [0x6B, 0x3C9],
  1119. 0x33C1 => [0x6D, 0x3C9],
  1120. /* 0x33C2 => [0x61, 0x2E, 0x6D, 0x2E], */
  1121. 0x33C3 => [0x62, 0x71],
  1122. 0x33C6 => [0x63, 0x2215, 0x6B, 0x67],
  1123. 0x33C7 => [0x63, 0x6F, 0x2E],
  1124. 0x33C8 => [0x64, 0x62],
  1125. 0x33C9 => [0x67, 0x79],
  1126. 0x33CB => [0x68, 0x70],
  1127. 0x33CD => [0x6B, 0x6B],
  1128. 0x33CE => [0x6B, 0x6D],
  1129. 0x33D7 => [0x70, 0x68],
  1130. 0x33D9 => [0x70, 0x70, 0x6D],
  1131. 0x33DA => [0x70, 0x72],
  1132. 0x33DC => [0x73, 0x76],
  1133. 0x33DD => [0x77, 0x62],
  1134. 0xFB00 => [0x66, 0x66],
  1135. 0xFB01 => [0x66, 0x69],
  1136. 0xFB02 => [0x66, 0x6C],
  1137. 0xFB03 => [0x66, 0x66, 0x69],
  1138. 0xFB04 => [0x66, 0x66, 0x6C],
  1139. 0xFB05 => [0x73, 0x74],
  1140. 0xFB06 => [0x73, 0x74],
  1141. 0xFB13 => [0x574, 0x576],
  1142. 0xFB14 => [0x574, 0x565],
  1143. 0xFB15 => [0x574, 0x56B],
  1144. 0xFB16 => [0x57E, 0x576],
  1145. 0xFB17 => [0x574, 0x56D],
  1146. 0xFF21 => [0xFF41],
  1147. 0xFF22 => [0xFF42],
  1148. 0xFF23 => [0xFF43],
  1149. 0xFF24 => [0xFF44],
  1150. 0xFF25 => [0xFF45],
  1151. 0xFF26 => [0xFF46],
  1152. 0xFF27 => [0xFF47],
  1153. 0xFF28 => [0xFF48],
  1154. 0xFF29 => [0xFF49],
  1155. 0xFF2A => [0xFF4A],
  1156. 0xFF2B => [0xFF4B],
  1157. 0xFF2C => [0xFF4C],
  1158. 0xFF2D => [0xFF4D],
  1159. 0xFF2E => [0xFF4E],
  1160. 0xFF2F => [0xFF4F],
  1161. 0xFF30 => [0xFF50],
  1162. 0xFF31 => [0xFF51],
  1163. 0xFF32 => [0xFF52],
  1164. 0xFF33 => [0xFF53],
  1165. 0xFF34 => [0xFF54],
  1166. 0xFF35 => [0xFF55],
  1167. 0xFF36 => [0xFF56],
  1168. 0xFF37 => [0xFF57],
  1169. 0xFF38 => [0xFF58],
  1170. 0xFF39 => [0xFF59],
  1171. 0xFF3A => [0xFF5A],
  1172. 0x10400 => [0x10428],
  1173. 0x10401 => [0x10429],
  1174. 0x10402 => [0x1042A],
  1175. 0x10403 => [0x1042B],
  1176. 0x10404 => [0x1042C],
  1177. 0x10405 => [0x1042D],
  1178. 0x10406 => [0x1042E],
  1179. 0x10407 => [0x1042F],
  1180. 0x10408 => [0x10430],
  1181. 0x10409 => [0x10431],
  1182. 0x1040A => [0x10432],
  1183. 0x1040B => [0x10433],
  1184. 0x1040C => [0x10434],
  1185. 0x1040D => [0x10435],
  1186. 0x1040E => [0x10436],
  1187. 0x1040F => [0x10437],
  1188. 0x10410 => [0x10438],
  1189. 0x10411 => [0x10439],
  1190. 0x10412 => [0x1043A],
  1191. 0x10413 => [0x1043B],
  1192. 0x10414 => [0x1043C],
  1193. 0x10415 => [0x1043D],
  1194. 0x10416 => [0x1043E],
  1195. 0x10417 => [0x1043F],
  1196. 0x10418 => [0x10440],
  1197. 0x10419 => [0x10441],
  1198. 0x1041A => [0x10442],
  1199. 0x1041B => [0x10443],
  1200. 0x1041C => [0x10444],
  1201. 0x1041D => [0x10445],
  1202. 0x1041E => [0x10446],
  1203. 0x1041F => [0x10447],
  1204. 0x10420 => [0x10448],
  1205. 0x10421 => [0x10449],
  1206. 0x10422 => [0x1044A],
  1207. 0x10423 => [0x1044B],
  1208. 0x10424 => [0x1044C],
  1209. 0x10425 => [0x1044D],
  1210. 0x1D400 => [0x61],
  1211. 0x1D401 => [0x62],
  1212. 0x1D402 => [0x63],
  1213. 0x1D403 => [0x64],
  1214. 0x1D404 => [0x65],
  1215. 0x1D405 => [0x66],
  1216. 0x1D406 => [0x67],
  1217. 0x1D407 => [0x68],
  1218. 0x1D408 => [0x69],
  1219. 0x1D409 => [0x6A],
  1220. 0x1D40A => [0x6B],
  1221. 0x1D40B => [0x6C],
  1222. 0x1D40C => [0x6D],
  1223. 0x1D40D => [0x6E],
  1224. 0x1D40E => [0x6F],
  1225. 0x1D40F => [0x70],
  1226. 0x1D410 => [0x71],
  1227. 0x1D411 => [0x72],
  1228. 0x1D412 => [0x73],
  1229. 0x1D413 => [0x74],
  1230. 0x1D414 => [0x75],
  1231. 0x1D415 => [0x76],
  1232. 0x1D416 => [0x77],
  1233. 0x1D417 => [0x78],
  1234. 0x1D418 => [0x79],
  1235. 0x1D419 => [0x7A],
  1236. 0x1D434 => [0x61],
  1237. 0x1D435 => [0x62],
  1238. 0x1D436 => [0x63],
  1239. 0x1D437 => [0x64],
  1240. 0x1D438 => [0x65],
  1241. 0x1D439 => [0x66],
  1242. 0x1D43A => [0x67],
  1243. 0x1D43B => [0x68],
  1244. 0x1D43C => [0x69],
  1245. 0x1D43D => [0x6A],
  1246. 0x1D43E => [0x6B],
  1247. 0x1D43F => [0x6C],
  1248. 0x1D440 => [0x6D],
  1249. 0x1D441 => [0x6E],
  1250. 0x1D442 => [0x6F],
  1251. 0x1D443 => [0x70],
  1252. 0x1D444 => [0x71],
  1253. 0x1D445 => [0x72],
  1254. 0x1D446 => [0x73],
  1255. 0x1D447 => [0x74],
  1256. 0x1D448 => [0x75],
  1257. 0x1D449 => [0x76],
  1258. 0x1D44A => [0x77],
  1259. 0x1D44B => [0x78],
  1260. 0x1D44C => [0x79],
  1261. 0x1D44D => [0x7A],
  1262. 0x1D468 => [0x61],
  1263. 0x1D469 => [0x62],
  1264. 0x1D46A => [0x63],
  1265. 0x1D46B => [0x64],
  1266. 0x1D46C => [0x65],
  1267. 0x1D46D => [0x66],
  1268. 0x1D46E => [0x67],
  1269. 0x1D46F => [0x68],
  1270. 0x1D470 => [0x69],
  1271. 0x1D471 => [0x6A],
  1272. 0x1D472 => [0x6B],
  1273. 0x1D473 => [0x6C],
  1274. 0x1D474 => [0x6D],
  1275. 0x1D475 => [0x6E],
  1276. 0x1D476 => [0x6F],
  1277. 0x1D477 => [0x70],
  1278. 0x1D478 => [0x71],
  1279. 0x1D479 => [0x72],
  1280. 0x1D47A => [0x73],
  1281. 0x1D47B => [0x74],
  1282. 0x1D47C => [0x75],
  1283. 0x1D47D => [0x76],
  1284. 0x1D47E => [0x77],
  1285. 0x1D47F => [0x78],
  1286. 0x1D480 => [0x79],
  1287. 0x1D481 => [0x7A],
  1288. 0x1D49C => [0x61],
  1289. 0x1D49E => [0x63],
  1290. 0x1D49F => [0x64],
  1291. 0x1D4A2 => [0x67],
  1292. 0x1D4A5 => [0x6A],
  1293. 0x1D4A6 => [0x6B],
  1294. 0x1D4A9 => [0x6E],
  1295. 0x1D4AA => [0x6F],
  1296. 0x1D4AB => [0x70],
  1297. 0x1D4AC => [0x71],
  1298. 0x1D4AE => [0x73],
  1299. 0x1D4AF => [0x74],
  1300. 0x1D4B0 => [0x75],
  1301. 0x1D4B1 => [0x76],
  1302. 0x1D4B2 => [0x77],
  1303. 0x1D4B3 => [0x78],
  1304. 0x1D4B4 => [0x79],
  1305. 0x1D4B5 => [0x7A],
  1306. 0x1D4D0 => [0x61],
  1307. 0x1D4D1 => [0x62],
  1308. 0x1D4D2 => [0x63],
  1309. 0x1D4D3 => [0x64],
  1310. 0x1D4D4 => [0x65],
  1311. 0x1D4D5 => [0x66],
  1312. 0x1D4D6 => [0x67],
  1313. 0x1D4D7 => [0x68],
  1314. 0x1D4D8 => [0x69],
  1315. 0x1D4D9 => [0x6A],
  1316. 0x1D4DA => [0x6B],
  1317. 0x1D4DB => [0x6C],
  1318. 0x1D4DC => [0x6D],
  1319. 0x1D4DD => [0x6E],
  1320. 0x1D4DE => [0x6F],
  1321. 0x1D4DF => [0x70],
  1322. 0x1D4E0 => [0x71],
  1323. 0x1D4E1 => [0x72],
  1324. 0x1D4E2 => [0x73],
  1325. 0x1D4E3 => [0x74],
  1326. 0x1D4E4 => [0x75],
  1327. 0x1D4E5 => [0x76],
  1328. 0x1D4E6 => [0x77],
  1329. 0x1D4E7 => [0x78],
  1330. 0x1D4E8 => [0x79],
  1331. 0x1D4E9 => [0x7A],
  1332. 0x1D504 => [0x61],
  1333. 0x1D505 => [0x62],
  1334. 0x1D507 => [0x64],
  1335. 0x1D508 => [0x65],
  1336. 0x1D509 => [0x66],
  1337. 0x1D50A => [0x67],
  1338. 0x1D50D => [0x6A],
  1339. 0x1D50E => [0x6B],
  1340. 0x1D50F => [0x6C],
  1341. 0x1D510 => [0x6D],
  1342. 0x1D511 => [0x6E],
  1343. 0x1D512 => [0x6F],
  1344. 0x1D513 => [0x70],
  1345. 0x1D514 => [0x71],
  1346. 0x1D516 => [0x73],
  1347. 0x1D517 => [0x74],
  1348. 0x1D518 => [0x75],
  1349. 0x1D519 => [0x76],
  1350. 0x1D51A => [0x77],
  1351. 0x1D51B => [0x78],
  1352. 0x1D51C => [0x79],
  1353. 0x1D538 => [0x61],
  1354. 0x1D539 => [0x62],
  1355. 0x1D53B => [0x64],
  1356. 0x1D53C => [0x65],
  1357. 0x1D53D => [0x66],
  1358. 0x1D53E => [0x67],
  1359. 0x1D540 => [0x69],
  1360. 0x1D541 => [0x6A],
  1361. 0x1D542 => [0x6B],
  1362. 0x1D543 => [0x6C],
  1363. 0x1D544 => [0x6D],
  1364. 0x1D546 => [0x6F],
  1365. 0x1D54A => [0x73],
  1366. 0x1D54B => [0x74],
  1367. 0x1D54C => [0x75],
  1368. 0x1D54D => [0x76],
  1369. 0x1D54E => [0x77],
  1370. 0x1D54F => [0x78],
  1371. 0x1D550 => [0x79],
  1372. 0x1D56C => [0x61],
  1373. 0x1D56D => [0x62],
  1374. 0x1D56E => [0x63],
  1375. 0x1D56F => [0x64],
  1376. 0x1D570 => [0x65],
  1377. 0x1D571 => [0x66],
  1378. 0x1D572 => [0x67],
  1379. 0x1D573 => [0x68],
  1380. 0x1D574 => [0x69],
  1381. 0x1D575 => [0x6A],
  1382. 0x1D576 => [0x6B],
  1383. 0x1D577 => [0x6C],
  1384. 0x1D578 => [0x6D],
  1385. 0x1D579 => [0x6E],
  1386. 0x1D57A => [0x6F],
  1387. 0x1D57B => [0x70],
  1388. 0x1D57C => [0x71],
  1389. 0x1D57D => [0x72],
  1390. 0x1D57E => [0x73],
  1391. 0x1D57F => [0x74],
  1392. 0x1D580 => [0x75],
  1393. 0x1D581 => [0x76],
  1394. 0x1D582 => [0x77],
  1395. 0x1D583 => [0x78],
  1396. 0x1D584 => [0x79],
  1397. 0x1D585 => [0x7A],
  1398. 0x1D5A0 => [0x61],
  1399. 0x1D5A1 => [0x62],
  1400. 0x1D5A2 => [0x63],
  1401. 0x1D5A3 => [0x64],
  1402. 0x1D5A4 => [0x65],
  1403. 0x1D5A5 => [0x66],
  1404. 0x1D5A6 => [0x67],
  1405. 0x1D5A7 => [0x68],
  1406. 0x1D5A8 => [0x69],
  1407. 0x1D5A9 => [0x6A],
  1408. 0x1D5AA => [0x6B],
  1409. 0x1D5AB => [0x6C],
  1410. 0x1D5AC => [0x6D],
  1411. 0x1D5AD => [0x6E],
  1412. 0x1D5AE => [0x6F],
  1413. 0x1D5AF => [0x70],
  1414. 0x1D5B0 => [0x71],
  1415. 0x1D5B1 => [0x72],
  1416. 0x1D5B2 => [0x73],
  1417. 0x1D5B3 => [0x74],
  1418. 0x1D5B4 => [0x75],
  1419. 0x1D5B5 => [0x76],
  1420. 0x1D5B6 => [0x77],
  1421. 0x1D5B7 => [0x78],
  1422. 0x1D5B8 => [0x79],
  1423. 0x1D5B9 => [0x7A],
  1424. 0x1D5D4 => [0x61],
  1425. 0x1D5D5 => [0x62],
  1426. 0x1D5D6 => [0x63],
  1427. 0x1D5D7 => [0x64],
  1428. 0x1D5D8 => [0x65],
  1429. 0x1D5D9 => [0x66],
  1430. 0x1D5DA => [0x67],
  1431. 0x1D5DB => [0x68],
  1432. 0x1D5DC => [0x69],
  1433. 0x1D5DD => [0x6A],
  1434. 0x1D5DE => [0x6B],
  1435. 0x1D5DF => [0x6C],
  1436. 0x1D5E0 => [0x6D],
  1437. 0x1D5E1 => [0x6E],
  1438. 0x1D5E2 => [0x6F],
  1439. 0x1D5E3 => [0x70],
  1440. 0x1D5E4 => [0x71],
  1441. 0x1D5E5 => [0x72],
  1442. 0x1D5E6 => [0x73],
  1443. 0x1D5E7 => [0x74],
  1444. 0x1D5E8 => [0x75],
  1445. 0x1D5E9 => [0x76],
  1446. 0x1D5EA => [0x77],
  1447. 0x1D5EB => [0x78],
  1448. 0x1D5EC => [0x79],
  1449. 0x1D5ED => [0x7A],
  1450. 0x1D608 => [0x61],
  1451. 0x1D609 => [0x62],
  1452. 0x1D60A => [0x63],
  1453. 0x1D60B => [0x64],
  1454. 0x1D60C => [0x65],
  1455. 0x1D60D => [0x66],
  1456. 0x1D60E => [0x67],
  1457. 0x1D60F => [0x68],
  1458. 0x1D610 => [0x69],
  1459. 0x1D611 => [0x6A],
  1460. 0x1D612 => [0x6B],
  1461. 0x1D613 => [0x6C],
  1462. 0x1D614 => [0x6D],
  1463. 0x1D615 => [0x6E],
  1464. 0x1D616 => [0x6F],
  1465. 0x1D617 => [0x70],
  1466. 0x1D618 => [0x71],
  1467. 0x1D619 => [0x72],
  1468. 0x1D61A => [0x73],
  1469. 0x1D61B => [0x74],
  1470. 0x1D61C => [0x75],
  1471. 0x1D61D => [0x76],
  1472. 0x1D61E => [0x77],
  1473. 0x1D61F => [0x78],
  1474. 0x1D620 => [0x79],
  1475. 0x1D621 => [0x7A],
  1476. 0x1D63C => [0x61],
  1477. 0x1D63D => [0x62],
  1478. 0x1D63E => [0x63],
  1479. 0x1D63F => [0x64],
  1480. 0x1D640 => [0x65],
  1481. 0x1D641 => [0x66],
  1482. 0x1D642 => [0x67],
  1483. 0x1D643 => [0x68],
  1484. 0x1D644 => [0x69],
  1485. 0x1D645 => [0x6A],
  1486. 0x1D646 => [0x6B],
  1487. 0x1D647 => [0x6C],
  1488. 0x1D648 => [0x6D],
  1489. 0x1D649 => [0x6E],
  1490. 0x1D64A => [0x6F],
  1491. 0x1D64B => [0x70],
  1492. 0x1D64C => [0x71],
  1493. 0x1D64D => [0x72],
  1494. 0x1D64E => [0x73],
  1495. 0x1D64F => [0x74],
  1496. 0x1D650 => [0x75],
  1497. 0x1D651 => [0x76],
  1498. 0x1D652 => [0x77],
  1499. 0x1D653 => [0x78],
  1500. 0x1D654 => [0x79],
  1501. 0x1D655 => [0x7A],
  1502. 0x1D670 => [0x61],
  1503. 0x1D671 => [0x62],
  1504. 0x1D672 => [0x63],
  1505. 0x1D673 => [0x64],
  1506. 0x1D674 => [0x65],
  1507. 0x1D675 => [0x66],
  1508. 0x1D676 => [0x67],
  1509. 0x1D677 => [0x68],
  1510. 0x1D678 => [0x69],
  1511. 0x1D679 => [0x6A],
  1512. 0x1D67A => [0x6B],
  1513. 0x1D67B => [0x6C],
  1514. 0x1D67C => [0x6D],
  1515. 0x1D67D => [0x6E],
  1516. 0x1D67E => [0x6F],
  1517. 0x1D67F => [0x70],
  1518. 0x1D680 => [0x71],
  1519. 0x1D681 => [0x72],
  1520. 0x1D682 => [0x73],
  1521. 0x1D683 => [0x74],
  1522. 0x1D684 => [0x75],
  1523. 0x1D685 => [0x76],
  1524. 0x1D686 => [0x77],
  1525. 0x1D687 => [0x78],
  1526. 0x1D688 => [0x79],
  1527. 0x1D689 => [0x7A],
  1528. 0x1D6A8 => [0x3B1],
  1529. 0x1D6A9 => [0x3B2],
  1530. 0x1D6AA => [0x3B3],
  1531. 0x1D6AB => [0x3B4],
  1532. 0x1D6AC => [0x3B5],
  1533. 0x1D6AD => [0x3B6],
  1534. 0x1D6AE => [0x3B7],
  1535. 0x1D6AF => [0x3B8],
  1536. 0x1D6B0 => [0x3B9],
  1537. 0x1D6B1 => [0x3BA],
  1538. 0x1D6B2 => [0x3BB],
  1539. 0x1D6B3 => [0x3BC],
  1540. 0x1D6B4 => [0x3BD],
  1541. 0x1D6B5 => [0x3BE],
  1542. 0x1D6B6 => [0x3BF],
  1543. 0x1D6B7 => [0x3C0],
  1544. 0x1D6B8 => [0x3C1],
  1545. 0x1D6B9 => [0x3B8],
  1546. 0x1D6BA => [0x3C3],
  1547. 0x1D6BB => [0x3C4],
  1548. 0x1D6BC => [0x3C5],
  1549. 0x1D6BD => [0x3C6],
  1550. 0x1D6BE => [0x3C7],
  1551. 0x1D6BF => [0x3C8],
  1552. 0x1D6C0 => [0x3C9],
  1553. 0x1D6D3 => [0x3C3],
  1554. 0x1D6E2 => [0x3B1],
  1555. 0x1D6E3 => [0x3B2],
  1556. 0x1D6E4 => [0x3B3],
  1557. 0x1D6E5 => [0x3B4],
  1558. 0x1D6E6 => [0x3B5],
  1559. 0x1D6E7 => [0x3B6],
  1560. 0x1D6E8 => [0x3B7],
  1561. 0x1D6E9 => [0x3B8],
  1562. 0x1D6EA => [0x3B9],
  1563. 0x1D6EB => [0x3BA],
  1564. 0x1D6EC => [0x3BB],
  1565. 0x1D6ED => [0x3BC],
  1566. 0x1D6EE => [0x3BD],
  1567. 0x1D6EF => [0x3BE],
  1568. 0x1D6F0 => [0x3BF],
  1569. 0x1D6F1 => [0x3C0],
  1570. 0x1D6F2 => [0x3C1],
  1571. 0x1D6F3 => [0x3B8],
  1572. 0x1D6F4 => [0x3C3],
  1573. 0x1D6F5 => [0x3C4],
  1574. 0x1D6F6 => [0x3C5],
  1575. 0x1D6F7 => [0x3C6],
  1576. 0x1D6F8 => [0x3C7],
  1577. 0x1D6F9 => [0x3C8],
  1578. 0x1D6FA => [0x3C9],
  1579. 0x1D70D => [0x3C3],
  1580. 0x1D71C => [0x3B1],
  1581. 0x1D71D => [0x3B2],
  1582. 0x1D71E => [0x3B3],
  1583. 0x1D71F => [0x3B4],
  1584. 0x1D720 => [0x3B5],
  1585. 0x1D721 => [0x3B6],
  1586. 0x1D722 => [0x3B7],
  1587. 0x1D723 => [0x3B8],
  1588. 0x1D724 => [0x3B9],
  1589. 0x1D725 => [0x3BA],
  1590. 0x1D726 => [0x3BB],
  1591. 0x1D727 => [0x3BC],
  1592. 0x1D728 => [0x3BD],
  1593. 0x1D729 => [0x3BE],
  1594. 0x1D72A => [0x3BF],
  1595. 0x1D72B => [0x3C0],
  1596. 0x1D72C => [0x3C1],
  1597. 0x1D72D => [0x3B8],
  1598. 0x1D72E => [0x3C3],
  1599. 0x1D72F => [0x3C4],
  1600. 0x1D730 => [0x3C5],
  1601. 0x1D731 => [0x3C6],
  1602. 0x1D732 => [0x3C7],
  1603. 0x1D733 => [0x3C8],
  1604. 0x1D734 => [0x3C9],
  1605. 0x1D747 => [0x3C3],
  1606. 0x1D756 => [0x3B1],
  1607. 0x1D757 => [0x3B2],
  1608. 0x1D758 => [0x3B3],
  1609. 0x1D759 => [0x3B4],
  1610. 0x1D75A => [0x3B5],
  1611. 0x1D75B => [0x3B6],
  1612. 0x1D75C => [0x3B7],
  1613. 0x1D75D => [0x3B8],
  1614. 0x1D75E => [0x3B9],
  1615. 0x1D75F => [0x3BA],
  1616. 0x1D760 => [0x3BB],
  1617. 0x1D761 => [0x3BC],
  1618. 0x1D762 => [0x3BD],
  1619. 0x1D763 => [0x3BE],
  1620. 0x1D764 => [0x3BF],
  1621. 0x1D765 => [0x3C0],
  1622. 0x1D766 => [0x3C1],
  1623. 0x1D767 => [0x3B8],
  1624. 0x1D768 => [0x3C3],
  1625. 0x1D769 => [0x3C4],
  1626. 0x1D76A => [0x3C5],
  1627. 0x1D76B => [0x3C6],
  1628. 0x1D76C => [0x3C7],
  1629. 0x1D76D => [0x3C8],
  1630. 0x1D76E => [0x3C9],
  1631. 0x1D781 => [0x3C3],
  1632. 0x1D790 => [0x3B1],
  1633. 0x1D791 => [0x3B2],
  1634. 0x1D792 => [0x3B3],
  1635. 0x1D793 => [0x3B4],
  1636. 0x1D794 => [0x3B5],
  1637. 0x1D795 => [0x3B6],
  1638. 0x1D796 => [0x3B7],
  1639. 0x1D797 => [0x3B8],
  1640. 0x1D798 => [0x3B9],
  1641. 0x1D799 => [0x3BA],
  1642. 0x1D79A => [0x3BB],
  1643. 0x1D79B => [0x3BC],
  1644. 0x1D79C => [0x3BD],
  1645. 0x1D79D => [0x3BE],
  1646. 0x1D79E => [0x3BF],
  1647. 0x1D79F => [0x3C0],
  1648. 0x1D7A0 => [0x3C1],
  1649. 0x1D7A1 => [0x3B8],
  1650. 0x1D7A2 => [0x3C3],
  1651. 0x1D7A3 => [0x3C4],
  1652. 0x1D7A4 => [0x3C5],
  1653. 0x1D7A5 => [0x3C6],
  1654. 0x1D7A6 => [0x3C7],
  1655. 0x1D7A7 => [0x3C8],
  1656. 0x1D7A8 => [0x3C9],
  1657. 0x1D7BB => [0x3C3],
  1658. 0x3F9 => [0x3C3],
  1659. 0x1D2C => [0x61],
  1660. 0x1D2D => [0xE6],
  1661. 0x1D2E => [0x62],
  1662. 0x1D30 => [0x64],
  1663. 0x1D31 => [0x65],
  1664. 0x1D32 => [0x1DD],
  1665. 0x1D33 => [0x67],
  1666. 0x1D34 => [0x68],
  1667. 0x1D35 => [0x69],
  1668. 0x1D36 => [0x6A],
  1669. 0x1D37 => [0x6B],
  1670. 0x1D38 => [0x6C],
  1671. 0x1D39 => [0x6D],
  1672. 0x1D3A => [0x6E],
  1673. 0x1D3C => [0x6F],
  1674. 0x1D3D => [0x223],
  1675. 0x1D3E => [0x70],
  1676. 0x1D3F => [0x72],
  1677. 0x1D40 => [0x74],
  1678. 0x1D41 => [0x75],
  1679. 0x1D42 => [0x77],
  1680. 0x213B => [0x66, 0x61, 0x78],
  1681. 0x3250 => [0x70, 0x74, 0x65],
  1682. 0x32CC => [0x68, 0x67],
  1683. 0x32CE => [0x65, 0x76],
  1684. 0x32CF => [0x6C, 0x74, 0x64],
  1685. 0x337A => [0x69, 0x75],
  1686. 0x33DE => [0x76, 0x2215, 0x6D],
  1687. 0x33DF => [0x61, 0x2215, 0x6D]
  1688. ];
  1689. /**
  1690. * Normalization Combining Classes; Code Points not listed
  1691. * got Combining Class 0.
  1692. *
  1693. * @static
  1694. * @var array
  1695. * @access private
  1696. */
  1697. private static $_np_norm_combcls = [
  1698. 0x334 => 1,
  1699. 0x335 => 1,
  1700. 0x336 => 1,
  1701. 0x337 => 1,
  1702. 0x338 => 1,
  1703. 0x93C => 7,
  1704. 0x9BC => 7,
  1705. 0xA3C => 7,
  1706. 0xABC => 7,
  1707. 0xB3C => 7,
  1708. 0xCBC => 7,
  1709. 0x1037 => 7,
  1710. 0x3099 => 8,
  1711. 0x309A => 8,
  1712. 0x94D => 9,
  1713. 0x9CD => 9,
  1714. 0xA4D => 9,
  1715. 0xACD => 9,
  1716. 0xB4D => 9,
  1717. 0xBCD => 9,
  1718. 0xC4D => 9,
  1719. 0xCCD => 9,
  1720. 0xD4D => 9,
  1721. 0xDCA => 9,
  1722. 0xE3A => 9,
  1723. 0xF84 => 9,
  1724. 0x1039 => 9,
  1725. 0x1714 => 9,
  1726. 0x1734 => 9,
  1727. 0x17D2 => 9,
  1728. 0x5B0 => 10,
  1729. 0x5B1 => 11,
  1730. 0x5B2 => 12,
  1731. 0x5B3 => 13,
  1732. 0x5B4 => 14,
  1733. 0x5B5 => 15,
  1734. 0x5B6 => 16,
  1735. 0x5B7 => 17,
  1736. 0x5B8 => 18,
  1737. 0x5B9 => 19,
  1738. 0x5BB => 20,
  1739. 0x5Bc => 21,
  1740. 0x5BD => 22,
  1741. 0x5BF => 23,
  1742. 0x5C1 => 24,
  1743. 0x5C2 => 25,
  1744. 0xFB1E => 26,
  1745. 0x64B => 27,
  1746. 0x64C => 28,
  1747. 0x64D => 29,
  1748. 0x64E => 30,
  1749. 0x64F => 31,
  1750. 0x650 => 32,
  1751. 0x651 => 33,
  1752. 0x652 => 34,
  1753. 0x670 => 35,
  1754. 0x711 => 36,
  1755. 0xC55 => 84,
  1756. 0xC56 => 91,
  1757. 0xE38 => 103,
  1758. 0xE39 => 103,
  1759. 0xE48 => 107,
  1760. 0xE49 => 107,
  1761. 0xE4A => 107,
  1762. 0xE4B => 107,
  1763. 0xEB8 => 118,
  1764. 0xEB9 => 118,
  1765. 0xEC8 => 122,
  1766. 0xEC9 => 122,
  1767. 0xECA => 122,
  1768. 0xECB => 122,
  1769. 0xF71 => 129,
  1770. 0xF72 => 130,
  1771. 0xF7A => 130,
  1772. 0xF7B => 130,
  1773. 0xF7C => 130,
  1774. 0xF7D => 130,
  1775. 0xF80 => 130,
  1776. 0xF74 => 132,
  1777. 0x321 => 202,
  1778. 0x322 => 202,
  1779. 0x327 => 202,
  1780. 0x328 => 202,
  1781. 0x31B => 216,
  1782. 0xF39 => 216,
  1783. 0x1D165 => 216,
  1784. 0x1D166 => 216,
  1785. 0x1D16E => 216,
  1786. 0x1D16F => 216,
  1787. 0x1D170 => 216,
  1788. 0x1D171 => 216,
  1789. 0x1D172 => 216,
  1790. 0x302A => 218,
  1791. 0x316 => 220,
  1792. 0x317 => 220,
  1793. 0x318 => 220,
  1794. 0x319 => 220,
  1795. 0x31C => 220,
  1796. 0x31D => 220,
  1797. 0x31E => 220,
  1798. 0x31F => 220,
  1799. 0x320 => 220,
  1800. 0x323 => 220,
  1801. 0x324 => 220,
  1802. 0x325 => 220,
  1803. 0x326 => 220,
  1804. 0x329 => 220,
  1805. 0x32A => 220,
  1806. 0x32B => 220,
  1807. 0x32C => 220,
  1808. 0x32D => 220,
  1809. 0x32E => 220,
  1810. 0x32F => 220,
  1811. 0x330 => 220,
  1812. 0x331 => 220,
  1813. 0x332 => 220,
  1814. 0x333 => 220,
  1815. 0x339 => 220,
  1816. 0x33A => 220,
  1817. 0x33B => 220,
  1818. 0x33C => 220,
  1819. 0x347 => 220,
  1820. 0x348 => 220,
  1821. 0x349 => 220,
  1822. 0x34D => 220,
  1823. 0x34E => 220,
  1824. 0x353 => 220,
  1825. 0x354 => 220,
  1826. 0x355 => 220,
  1827. 0x356 => 220,
  1828. 0x591 => 220,
  1829. 0x596 => 220,
  1830. 0x59B => 220,
  1831. 0x5A3 => 220,
  1832. 0x5A4 => 220,
  1833. 0x5A5 => 220,
  1834. 0x5A6 => 220,
  1835. 0x5A7 => 220,
  1836. 0x5AA => 220,
  1837. 0x655 => 220,
  1838. 0x656 => 220,
  1839. 0x6E3 => 220,
  1840. 0x6EA => 220,
  1841. 0x6ED => 220,
  1842. 0x731 => 220,
  1843. 0x734 => 220,
  1844. 0x737 => 220,
  1845. 0x738 => 220,
  1846. 0x739 => 220,
  1847. 0x73B => 220,
  1848. 0x73C => 220,
  1849. 0x73E => 220,
  1850. 0x742 => 220,
  1851. 0x744 => 220,
  1852. 0x746 => 220,
  1853. 0x748 => 220,
  1854. 0x952 => 220,
  1855. 0xF18 => 220,
  1856. 0xF19 => 220,
  1857. 0xF35 => 220,
  1858. 0xF37 => 220,
  1859. 0xFC6 => 220,
  1860. 0x193B => 220,
  1861. 0x20E8 => 220,
  1862. 0x1D17B => 220,
  1863. 0x1D17C => 220,
  1864. 0x1D17D => 220,
  1865. 0x1D17E => 220,
  1866. 0x1D17F => 220,
  1867. 0x1D180 => 220,
  1868. 0x1D181 => 220,
  1869. 0x1D182 => 220,
  1870. 0x1D18A => 220,
  1871. 0x1D18B => 220,
  1872. 0x59A => 222,
  1873. 0x5AD => 222,
  1874. 0x1929 => 222,
  1875. 0x302D => 222,
  1876. 0x302E => 224,
  1877. 0x302F => 224,
  1878. 0x1D16D => 226,
  1879. 0x5AE => 228,
  1880. 0x18A9 => 228,
  1881. 0x302B => 228,
  1882. 0x300 => 230,
  1883. 0x301 => 230,
  1884. 0x302 => 230,
  1885. 0x303 => 230,
  1886. 0x304 => 230,
  1887. 0x305 => 230,
  1888. 0x306 => 230,
  1889. 0x307 => 230,
  1890. 0x308 => 230,
  1891. 0x309 => 230,
  1892. 0x30A => 230,
  1893. 0x30B => 230,
  1894. 0x30C => 230,
  1895. 0x30D => 230,
  1896. 0x30E => 230,
  1897. 0x30F => 230,
  1898. 0x310 => 230,
  1899. 0x311 => 230,
  1900. 0x312 => 230,
  1901. 0x313 => 230,
  1902. 0x314 => 230,
  1903. 0x33D => 230,
  1904. 0x33E => 230,
  1905. 0x33F => 230,
  1906. 0x340 => 230,
  1907. 0x341 => 230,
  1908. 0x342 => 230,
  1909. 0x343 => 230,
  1910. 0x344 => 230,
  1911. 0x346 => 230,
  1912. 0x34A => 230,
  1913. 0x34B => 230,
  1914. 0x34C => 230,
  1915. 0x350 => 230,
  1916. 0x351 => 230,
  1917. 0x352 => 230,
  1918. 0x357 => 230,
  1919. 0x363 => 230,
  1920. 0x364 => 230,
  1921. 0x365 => 230,
  1922. 0x366 => 230,
  1923. 0x367 => 230,
  1924. 0x368 => 230,
  1925. 0x369 => 230,
  1926. 0x36A => 230,
  1927. 0x36B => 230,
  1928. 0x36C => 230,
  1929. 0x36D => 230,
  1930. 0x36E => 230,
  1931. 0x36F => 230,
  1932. 0x483 => 230,
  1933. 0x484 => 230,
  1934. 0x485 => 230,
  1935. 0x486 => 230,
  1936. 0x592 => 230,
  1937. 0x593 => 230,
  1938. 0x594 => 230,
  1939. 0x595 => 230,
  1940. 0x597 => 230,
  1941. 0x598 => 230,
  1942. 0x599 => 230,
  1943. 0x59C => 230,
  1944. 0x59D => 230,
  1945. 0x59E => 230,
  1946. 0x59F => 230,
  1947. 0x5A0 => 230,
  1948. 0x5A1 => 230,
  1949. 0x5A8 => 230,
  1950. 0x5A9 => 230,
  1951. 0x5AB => 230,
  1952. 0x5AC => 230,
  1953. 0x5AF => 230,
  1954. 0x5C4 => 230,
  1955. 0x610 => 230,
  1956. 0x611 => 230,
  1957. 0x612 => 230,
  1958. 0x613 => 230,
  1959. 0x614 => 230,
  1960. 0x615 => 230,
  1961. 0x653 => 230,
  1962. 0x654 => 230,
  1963. 0x657 => 230,
  1964. 0x658 => 230,
  1965. 0x6D6 => 230,
  1966. 0x6D7 => 230,
  1967. 0x6D8 => 230,
  1968. 0x6D9 => 230,
  1969. 0x6DA => 230,
  1970. 0x6DB => 230,
  1971. 0x6DC => 230,
  1972. 0x6DF => 230,
  1973. 0x6E0 => 230,
  1974. 0x6E1 => 230,
  1975. 0x6E2 => 230,
  1976. 0x6E4 => 230,
  1977. 0x6E7 => 230,
  1978. 0x6E8 => 230,
  1979. 0x6EB => 230,
  1980. 0x6EC => 230,
  1981. 0x730 => 230,
  1982. 0x732 => 230,
  1983. 0x733 => 230,
  1984. 0x735 => 230,
  1985. 0x736 => 230,
  1986. 0x73A => 230,
  1987. 0x73D => 230,
  1988. 0x73F => 230,
  1989. 0x740 => 230,
  1990. 0x741 => 230,
  1991. 0x743 => 230,
  1992. 0x745 => 230,
  1993. 0x747 => 230,
  1994. 0x749 => 230,
  1995. 0x74A => 230,
  1996. 0x951 => 230,
  1997. 0x953 => 230,
  1998. 0x954 => 230,
  1999. 0xF82 => 230,
  2000. 0xF83 => 230,
  2001. 0xF86 => 230,
  2002. 0xF87 => 230,
  2003. 0x170D => 230,
  2004. 0x193A => 230,
  2005. 0x20D0 => 230,
  2006. 0x20D1 => 230,
  2007. 0x20D4 => 230,
  2008. 0x20D5 => 230,
  2009. 0x20D6 => 230,
  2010. 0x20D7 => 230,
  2011. 0x20DB => 230,
  2012. 0x20DC => 230,
  2013. 0x20E1 => 230,
  2014. 0x20E7 => 230,
  2015. 0x20E9 => 230,
  2016. 0xFE20 => 230,
  2017. 0xFE21 => 230,
  2018. 0xFE22 => 230,
  2019. 0xFE23 => 230,
  2020. 0x1D185 => 230,
  2021. 0x1D186 => 230,
  2022. 0x1D187 => 230,
  2023. 0x1D189 => 230,
  2024. 0x1D188 => 230,
  2025. 0x1D1AA => 230,
  2026. 0x1D1AB => 230,
  2027. 0x1D1AC => 230,
  2028. 0x1D1AD => 230,
  2029. 0x315 => 232,
  2030. 0x31A => 232,
  2031. 0x302C => 232,
  2032. 0x35F => 233,
  2033. 0x362 => 233,
  2034. 0x35D => 234,
  2035. 0x35E => 234,
  2036. 0x360 => 234,
  2037. 0x361 => 234,
  2038. 0x345 => 240
  2039. ];
  2040. // }}}
  2041. // {{{ properties
  2042. /**
  2043. * @var string
  2044. * @access private
  2045. */
  2046. private $_punycode_prefix = 'xn--';
  2047. /**
  2048. * @access private
  2049. */
  2050. private $_invalid_ucs = 0x80000000;
  2051. /**
  2052. * @access private
  2053. */
  2054. private $_max_ucs = 0x10FFFF;
  2055. /**
  2056. * @var int
  2057. * @access private
  2058. */
  2059. private $_base = 36;
  2060. /**
  2061. * @var int
  2062. * @access private
  2063. */
  2064. private $_tmin = 1;
  2065. /**
  2066. * @var int
  2067. * @access private
  2068. */
  2069. private $_tmax = 26;
  2070. /**
  2071. * @var int
  2072. * @access private
  2073. */
  2074. private $_skew = 38;
  2075. /**
  2076. * @var int
  2077. * @access private
  2078. */
  2079. private $_damp = 700;
  2080. /**
  2081. * @var int
  2082. * @access private
  2083. */
  2084. private $_initial_bias = 72;
  2085. /**
  2086. * @var int
  2087. * @access private
  2088. */
  2089. private $_initial_n = 0x80;
  2090. /**
  2091. * @var int
  2092. * @access private
  2093. */
  2094. private $_slast;
  2095. /**
  2096. * @access private
  2097. */
  2098. private $_sbase = 0xAC00;
  2099. /**
  2100. * @access private
  2101. */
  2102. private $_lbase = 0x1100;
  2103. /**
  2104. * @access private
  2105. */
  2106. private $_vbase = 0x1161;
  2107. /**
  2108. * @access private
  2109. */
  2110. private $_tbase = 0x11a7;
  2111. /**
  2112. * @var int
  2113. * @access private
  2114. */
  2115. private $_lcount = 19;
  2116. /**
  2117. * @var int
  2118. * @access private
  2119. */
  2120. private $_vcount = 21;
  2121. /**
  2122. * @var int
  2123. * @access private
  2124. */
  2125. private $_tcount = 28;
  2126. /**
  2127. * vcount * tcount
  2128. *
  2129. * @var int
  2130. * @access private
  2131. */
  2132. private $_ncount = 588;
  2133. /**
  2134. * lcount * tcount * vcount
  2135. *
  2136. * @var int
  2137. * @access private
  2138. */
  2139. private $_scount = 11172;
  2140. /**
  2141. * Default encoding for encode()'s input and decode()'s output is UTF-8;
  2142. * Other possible encodings are ucs4_string and ucs4_array
  2143. * See {@link setParams()} for how to select these
  2144. *
  2145. * @var bool
  2146. * @access private
  2147. */
  2148. private $_api_encoding = 'utf8';
  2149. /**
  2150. * Overlong UTF-8 encodings are forbidden
  2151. *
  2152. * @var bool
  2153. * @access private
  2154. */
  2155. private $_allow_overlong = false;
  2156. /**
  2157. * Behave strict or not
  2158. *
  2159. * @var bool
  2160. * @access private
  2161. */
  2162. private $_strict_mode = false;
  2163. /**
  2164. * IDNA-version to use
  2165. *
  2166. * Values are "2003" and "2008".
  2167. * Defaults to "2003", since that was the original version and for
  2168. * compatibility with previous versions of this library.
  2169. * If you need to encode "new" characters like the German "Eszett",
  2170. * please switch to 2008 first before encoding.
  2171. *
  2172. * @var bool
  2173. * @access private
  2174. */
  2175. private $_version = '2003';
  2176. /**
  2177. * Cached value indicating whether or not mbstring function overloading is
  2178. * on for strlen
  2179. *
  2180. * This is cached for optimal performance.
  2181. *
  2182. * @var boolean
  2183. * @see Net_IDNA2::_byteLength()
  2184. */
  2185. private static $_mb_string_overload = null;
  2186. // }}}
  2187. // {{{ constructor
  2188. /**
  2189. * Constructor
  2190. *
  2191. * @param array|null $options Options to initialise the object with
  2192. *
  2193. * @access public
  2194. * @see setParams()
  2195. */
  2196. public function __construct($options = null)
  2197. {
  2198. $this->_slast = $this->_sbase + $this->_lcount * $this->_vcount * $this->_tcount;
  2199. if (is_array($options)) {
  2200. $this->setParams($options);
  2201. }
  2202. // populate mbstring overloading cache if not set
  2203. if (self::$_mb_string_overload === null) {
  2204. self::$_mb_string_overload = (extension_loaded('mbstring')
  2205. && (ini_get('mbstring.func_overload') & 0x02) === 0x02);
  2206. }
  2207. }
  2208. // }}}
  2209. /**
  2210. * Sets a new option value. Available options and values:
  2211. *
  2212. * [utf8 - Use either UTF-8 or ISO-8859-1 as input (true for UTF-8, false
  2213. * otherwise); The output is always UTF-8]
  2214. * [overlong - Unicode does not allow unnecessarily long encodings of chars,
  2215. * to allow this, set this parameter to true, else to false;
  2216. * default is false.]
  2217. * [strict - true: strict mode, good for registration purposes - Causes errors
  2218. * on failures; false: loose mode, ideal for "wildlife" applications
  2219. * by silently ignoring errors and returning the original input instead]
  2220. *
  2221. * @param mixed $option Parameter to set (string: single parameter; array of Parameter => Value pairs)
  2222. * @param string|false $value Value to use (if parameter 1 is a string)
  2223. *
  2224. * @return bool true on success, false otherwise
  2225. * @access public
  2226. */
  2227. public function setParams($option, $value = false): bool
  2228. {
  2229. if (!is_array($option)) {
  2230. $option = [$option => $value];
  2231. }
  2232. foreach ($option as $k => $v) {
  2233. switch ($k) {
  2234. case 'encoding':
  2235. switch ($v) {
  2236. case 'utf8':
  2237. case 'ucs4_string':
  2238. case 'ucs4_array':
  2239. $this->_api_encoding = $v;
  2240. break;
  2241. default:
  2242. throw new InvalidArgumentException('Set Parameter: Unknown parameter ' . $v . ' for option ' . $k);
  2243. }
  2244. break;
  2245. case 'overlong':
  2246. $this->_allow_overlong = ($v) ? true : false;
  2247. break;
  2248. case 'strict':
  2249. $this->_strict_mode = ($v) ? true : false;
  2250. break;
  2251. case 'version':
  2252. if (in_array($v, ['2003', '2008'])) {
  2253. $this->_version = $v;
  2254. } else {
  2255. throw new InvalidArgumentException('Set Parameter: Invalid parameter ' . $v . ' for option ' . $k);
  2256. }
  2257. break;
  2258. default:
  2259. return false;
  2260. }
  2261. }
  2262. return true;
  2263. }
  2264. /**
  2265. * Encode a given UTF-8 domain name.
  2266. *
  2267. * @param string $decoded Domain name (UTF-8 or UCS-4)
  2268. * @param string|false $one_time_encoding Desired input encoding, see {@link set_parameter}
  2269. * If not given will use default-encoding
  2270. *
  2271. * @return mixed Encoded Domain name (ACE string) / processed string
  2272. * @throws Exception
  2273. * @access public
  2274. */
  2275. public function encode(string $decoded, $one_time_encoding = false)
  2276. {
  2277. // Forcing conversion of input to UCS4 array
  2278. // If one time encoding is given, use this, else the objects property
  2279. switch (($one_time_encoding) ? $one_time_encoding : $this->_api_encoding) {
  2280. case 'utf8':
  2281. $decoded = $this->_utf8_to_ucs4($decoded);
  2282. break;
  2283. case 'ucs4_string':
  2284. $decoded = $this->_ucs4_string_to_ucs4($decoded);
  2285. // no break
  2286. case 'ucs4_array':
  2287. break;
  2288. default:
  2289. throw new InvalidArgumentException('Unsupported input format');
  2290. }
  2291. // No input, no output, what else did you expect?
  2292. if (empty($decoded)) {
  2293. return '';
  2294. }
  2295. // Anchors for iteration
  2296. $last_begin = 0;
  2297. // Output string
  2298. $output = '';
  2299. foreach ($decoded as $k => $v) {
  2300. // Make sure to use just the plain dot
  2301. switch ($v) {
  2302. case 0x3002:
  2303. case 0xFF0E:
  2304. case 0xFF61:
  2305. $decoded[$k] = 0x2E;
  2306. // It's right, no break here
  2307. // The codepoints above have to be converted to dots anyway
  2308. // Stumbling across an anchoring character
  2309. // no break
  2310. case 0x2E:
  2311. case 0x2F:
  2312. case 0x3A:
  2313. case 0x3F:
  2314. case 0x40:
  2315. // Neither email addresses nor URLs allowed in strict mode
  2316. if ($this->_strict_mode) {
  2317. throw new InvalidArgumentException('Neither email addresses nor URLs are allowed in strict mode.');
  2318. }
  2319. // Skip first char
  2320. if ($k) {
  2321. $encoded = '';
  2322. $encoded = $this->_encode(array_slice($decoded, $last_begin, (($k) - $last_begin)));
  2323. if ($encoded) {
  2324. $output .= $encoded;
  2325. } else {
  2326. $output .= $this->_ucs4_to_utf8(array_slice($decoded, $last_begin, (($k) - $last_begin)));
  2327. }
  2328. $output .= chr($decoded[$k]);
  2329. }
  2330. $last_begin = $k + 1;
  2331. }
  2332. }
  2333. // Catch the rest of the string
  2334. if ($last_begin) {
  2335. $inp_len = sizeof($decoded);
  2336. $encoded = '';
  2337. $encoded = $this->_encode(array_slice($decoded, $last_begin, (($inp_len) - $last_begin)));
  2338. if ($encoded) {
  2339. $output .= $encoded;
  2340. } else {
  2341. $output .= $this->_ucs4_to_utf8(array_slice($decoded, $last_begin, (($inp_len) - $last_begin)));
  2342. }
  2343. return $output;
  2344. }
  2345. if ($output = $this->_encode($decoded)) {
  2346. return $output;
  2347. }
  2348. return $this->_ucs4_to_utf8($decoded);
  2349. }
  2350. /**
  2351. * Decode a given ACE domain name.
  2352. *
  2353. * @param string $input Domain name (ACE string)
  2354. * @param string|false $one_time_encoding Desired output encoding, see {@link set_parameter}
  2355. *
  2356. * @return mixed Decoded Domain name (UTF-8 or UCS-4) / processed string
  2357. * @throws Exception
  2358. * @access public
  2359. */
  2360. public function decode(string $input, $one_time_encoding = false)
  2361. {
  2362. // Optionally set
  2363. if ($one_time_encoding) {
  2364. switch ($one_time_encoding) {
  2365. case 'utf8':
  2366. case 'ucs4_string':
  2367. case 'ucs4_array':
  2368. break;
  2369. default:
  2370. throw new InvalidArgumentException('Unknown encoding ' . $one_time_encoding);
  2371. }
  2372. }
  2373. // Make sure to drop any newline characters around
  2374. $input = trim($input);
  2375. // Negotiate input and try to determine, whether it is a plain string,
  2376. // an email address or something like a complete URL
  2377. if (strpos($input, '@')) { // Maybe it is an email address
  2378. // No no in strict mode
  2379. if ($this->_strict_mode) {
  2380. throw new InvalidArgumentException('Only simple domain name parts can be handled in strict mode');
  2381. }
  2382. list($email_pref, $input) = explode('@', $input, 2);
  2383. $arr = explode('.', $input);
  2384. foreach ($arr as $k => $v) {
  2385. $conv = $this->_decode($v);
  2386. if ($conv) {
  2387. $arr[$k] = $conv;
  2388. }
  2389. }
  2390. $return = $email_pref . '@' . join('.', $arr);
  2391. } elseif (preg_match('![:\./]!', $input)) { // Or a complete domain name (with or without paths / parameters)
  2392. // No no in strict mode
  2393. if ($this->_strict_mode) {
  2394. throw new InvalidArgumentException('Only simple domain name parts can be handled in strict mode');
  2395. }
  2396. $parsed = parse_url($input);
  2397. if (isset($parsed['host'])) {
  2398. $arr = explode('.', $parsed['host']);
  2399. foreach ($arr as $k => $v) {
  2400. $conv = $this->_decode($v);
  2401. if ($conv) {
  2402. $arr[$k] = $conv;
  2403. }
  2404. }
  2405. $parsed['host'] = join('.', $arr);
  2406. if (isset($parsed['scheme'])) {
  2407. $parsed['scheme'] .= (strtolower($parsed['scheme']) == 'mailto') ? ':' : '://';
  2408. }
  2409. $return = $this->_unparse_url($parsed);
  2410. } else { // parse_url seems to have failed, try without it
  2411. $arr = explode('.', $input);
  2412. foreach ($arr as $k => $v) {
  2413. $conv = $this->_decode($v);
  2414. if ($conv) {
  2415. $arr[$k] = $conv;
  2416. }
  2417. }
  2418. $return = join('.', $arr);
  2419. }
  2420. } else { // Otherwise we consider it being a pure domain name string
  2421. $return = $this->_decode($input);
  2422. }
  2423. // The output is UTF-8 by default, other output formats need conversion here
  2424. // If one time encoding is given, use this, else the objects property
  2425. switch (($one_time_encoding) ? $one_time_encoding : $this->_api_encoding) {
  2426. case 'utf8':
  2427. return $return;
  2428. break;
  2429. case 'ucs4_string':
  2430. return $this->_ucs4_to_ucs4_string($this->_utf8_to_ucs4($return));
  2431. break;
  2432. case 'ucs4_array':
  2433. return $this->_utf8_to_ucs4($return);
  2434. break;
  2435. default:
  2436. throw new InvalidArgumentException('Unsupported output format');
  2437. }
  2438. }
  2439. // {{{ private
  2440. /**
  2441. * Opposite function to parse_url()
  2442. *
  2443. * Inspired by code from comments of php.net-documentation for parse_url()
  2444. *
  2445. * @param array $parts_arr parts (strings) as returned by parse_url()
  2446. *
  2447. * @return string
  2448. * @access private
  2449. */
  2450. private function _unparse_url(array $parts_arr): string
  2451. {
  2452. if (!empty($parts_arr['scheme'])) {
  2453. $ret_url = $parts_arr['scheme'];
  2454. }
  2455. if (!empty($parts_arr['user'])) {
  2456. $ret_url .= $parts_arr['user'];
  2457. if (!empty($parts_arr['pass'])) {
  2458. $ret_url .= ':' . $parts_arr['pass'];
  2459. }
  2460. $ret_url .= '@';
  2461. }
  2462. $ret_url .= $parts_arr['host'];
  2463. if (!empty($parts_arr['port'])) {
  2464. $ret_url .= ':' . $parts_arr['port'];
  2465. }
  2466. $ret_url .= $parts_arr['path'];
  2467. if (!empty($parts_arr['query'])) {
  2468. $ret_url .= '?' . $parts_arr['query'];
  2469. }
  2470. if (!empty($parts_arr['fragment'])) {
  2471. $ret_url .= '#' . $parts_arr['fragment'];
  2472. }
  2473. return $ret_url;
  2474. }
  2475. /**
  2476. * The actual encoding algorithm.
  2477. *
  2478. * @param array of strings $decoded Decoded string which should be encoded
  2479. *
  2480. * @return string Encoded string
  2481. * @throws Exception
  2482. * @access private
  2483. */
  2484. private function _encode($decoded): string
  2485. {
  2486. // We cannot encode a domain name containing the Punycode prefix
  2487. $extract = self::_byteLength($this->_punycode_prefix);
  2488. $check_pref = $this->_utf8_to_ucs4($this->_punycode_prefix);
  2489. $check_deco = array_slice($decoded, 0, $extract);
  2490. if ($check_pref == $check_deco) {
  2491. throw new InvalidArgumentException('This is already a punycode string');
  2492. }
  2493. // We will not try to encode strings consisting of basic code points only
  2494. $encodable = false;
  2495. foreach ($decoded as $k => $v) {
  2496. if ($v > 0x7a) {
  2497. $encodable = true;
  2498. break;
  2499. }
  2500. }
  2501. if (!$encodable) {
  2502. if ($this->_strict_mode) {
  2503. throw new InvalidArgumentException('The given string does not contain encodable chars');
  2504. }
  2505. return false;
  2506. }
  2507. // Do NAMEPREP
  2508. $decoded = $this->_nameprep($decoded);
  2509. $deco_len = count($decoded);
  2510. // Empty array
  2511. if (!$deco_len) {
  2512. return false;
  2513. }
  2514. // How many chars have been consumed
  2515. $codecount = 0;
  2516. // Start with the prefix; copy it to output
  2517. $encoded = $this->_punycode_prefix;
  2518. $encoded = '';
  2519. // Copy all basic code points to output
  2520. for ($i = 0; $i < $deco_len; ++$i) {
  2521. $test = $decoded[$i];
  2522. // Will match [0-9a-zA-Z-]
  2523. if ((0x2F < $test && $test < 0x40)
  2524. || (0x40 < $test && $test < 0x5B)
  2525. || (0x60 < $test && $test <= 0x7B)
  2526. || (0x2D == $test)
  2527. ) {
  2528. $encoded .= chr($decoded[$i]);
  2529. $codecount++;
  2530. }
  2531. }
  2532. // All codepoints were basic ones
  2533. if ($codecount == $deco_len) {
  2534. return $encoded;
  2535. }
  2536. // Start with the prefix; copy it to output
  2537. $encoded = $this->_punycode_prefix . $encoded;
  2538. // If we have basic code points in output, add an hyphen to the end
  2539. if ($codecount) {
  2540. $encoded .= '-';
  2541. }
  2542. // Now find and encode all non-basic code points
  2543. $is_first = true;
  2544. $cur_code = $this->_initial_n;
  2545. $bias = $this->_initial_bias;
  2546. $delta = 0;
  2547. while ($codecount < $deco_len) {
  2548. // Find the smallest code point >= the current code point and
  2549. // remember the last ouccrence of it in the input
  2550. for ($i = 0, $next_code = $this->_max_ucs; $i < $deco_len; $i++) {
  2551. if ($decoded[$i] >= $cur_code && $decoded[$i] <= $next_code) {
  2552. $next_code = $decoded[$i];
  2553. }
  2554. }
  2555. $delta += ($next_code - $cur_code) * ($codecount + 1);
  2556. $cur_code = $next_code;
  2557. // Scan input again and encode all characters whose code point is $cur_code
  2558. for ($i = 0; $i < $deco_len; $i++) {
  2559. if ($decoded[$i] < $cur_code) {
  2560. $delta++;
  2561. } elseif ($decoded[$i] == $cur_code) {
  2562. for ($q = $delta, $k = $this->_base; 1; $k += $this->_base) {
  2563. $t = ($k <= $bias) ?
  2564. $this->_tmin :
  2565. (($k >= $bias + $this->_tmax) ? $this->_tmax : $k - $bias);
  2566. if ($q < $t) {
  2567. break;
  2568. }
  2569. $encoded .= $this->_encodeDigit(ceil($t + (($q - $t) % ($this->_base - $t))));
  2570. $q = ($q - $t) / ($this->_base - $t);
  2571. }
  2572. $encoded .= $this->_encodeDigit($q);
  2573. $bias = $this->_adapt($delta, $codecount + 1, $is_first);
  2574. $codecount++;
  2575. $delta = 0;
  2576. $is_first = false;
  2577. }
  2578. }
  2579. $delta++;
  2580. $cur_code++;
  2581. }
  2582. return $encoded;
  2583. }
  2584. /**
  2585. * The actual decoding algorithm.
  2586. *
  2587. * @param string $encoded Encoded string which should be decoded
  2588. *
  2589. * @return string Decoded string
  2590. * @throws Exception
  2591. * @access private
  2592. */
  2593. private function _decode($encoded): string
  2594. {
  2595. // We do need to find the Punycode prefix
  2596. if (!preg_match('!^' . preg_quote($this->_punycode_prefix, '!') . '!', $encoded)) {
  2597. return false;
  2598. }
  2599. $encode_test = preg_replace('!^' . preg_quote($this->_punycode_prefix, '!') . '!', '', $encoded);
  2600. // If nothing left after removing the prefix, it is hopeless
  2601. if (!$encode_test) {
  2602. return false;
  2603. }
  2604. // Find last occurrence of the delimiter
  2605. $delim_pos = strrpos($encoded, '-');
  2606. if ($delim_pos > self::_byteLength($this->_punycode_prefix)) {
  2607. for ($k = self::_byteLength($this->_punycode_prefix); $k < $delim_pos; ++$k) {
  2608. $decoded[] = ord($encoded[$k]);
  2609. }
  2610. } else {
  2611. $decoded = [];
  2612. }
  2613. $deco_len = count($decoded);
  2614. $enco_len = self::_byteLength($encoded);
  2615. // Wandering through the strings; init
  2616. $is_first = true;
  2617. $bias = $this->_initial_bias;
  2618. $idx = 0;
  2619. $char = $this->_initial_n;
  2620. for ($enco_idx = ($delim_pos) ? ($delim_pos + 1) : 0; $enco_idx < $enco_len; ++$deco_len) {
  2621. for ($old_idx = $idx, $w = 1, $k = $this->_base; 1; $k += $this->_base) {
  2622. $digit = $this->_decodeDigit($encoded[$enco_idx++]);
  2623. $idx += $digit * $w;
  2624. $t = ($k <= $bias) ?
  2625. $this->_tmin :
  2626. (($k >= $bias + $this->_tmax) ? $this->_tmax : ($k - $bias));
  2627. if ($digit < $t) {
  2628. break;
  2629. }
  2630. $w = (int)($w * ($this->_base - $t));
  2631. }
  2632. $bias = $this->_adapt($idx - $old_idx, $deco_len + 1, $is_first);
  2633. $is_first = false;
  2634. $char += (int)($idx / ($deco_len + 1));
  2635. $idx %= ($deco_len + 1);
  2636. if ($deco_len > 0) {
  2637. // Make room for the decoded char
  2638. for ($i = $deco_len; $i > $idx; $i--) {
  2639. $decoded[$i] = $decoded[($i - 1)];
  2640. }
  2641. }
  2642. $decoded[$idx++] = $char;
  2643. }
  2644. return $this->_ucs4_to_utf8($decoded);
  2645. }
  2646. /**
  2647. * Adapt the bias according to the current code point and position.
  2648. *
  2649. * @param int $delta ...
  2650. * @param int $npoints ...
  2651. * @param bool $is_first ...
  2652. *
  2653. * @return int
  2654. * @access private
  2655. */
  2656. private function _adapt(int $delta, int $npoints, bool $is_first): int
  2657. {
  2658. $delta = (int)($is_first ? ($delta / $this->_damp) : ($delta / 2));
  2659. $delta += (int)($delta / $npoints);
  2660. for ($k = 0; $delta > (($this->_base - $this->_tmin) * $this->_tmax) / 2; $k += $this->_base) {
  2661. $delta = (int)($delta / ($this->_base - $this->_tmin));
  2662. }
  2663. return (int)($k + ($this->_base - $this->_tmin + 1) * $delta / ($delta + $this->_skew));
  2664. }
  2665. /**
  2666. * Encoding a certain digit.
  2667. *
  2668. * @param int $d One digit to encode
  2669. *
  2670. * @return string (char) Encoded digit
  2671. * @access private
  2672. */
  2673. private function _encodeDigit(int $d): string
  2674. {
  2675. return chr($d + 22 + 75 * ($d < 26));
  2676. }
  2677. /**
  2678. * Decode a certain digit.
  2679. *
  2680. * @param string (char) $cp One digit (character) to decode
  2681. *
  2682. * @return int Decoded digit
  2683. * @access private
  2684. */
  2685. private function _decodeDigit(string $cp): int
  2686. {
  2687. $cp = ord($cp);
  2688. return ($cp - 48 < 10) ? $cp - 22 : (($cp - 65 < 26) ? $cp - 65 : (($cp - 97 < 26) ? $cp - 97 : $this->_base));
  2689. }
  2690. /**
  2691. * Do Nameprep according to RFC3491 and RFC3454.
  2692. *
  2693. * @param array $input Unicode Characters
  2694. *
  2695. * @return array of strings Unicode Characters, Nameprep'd
  2696. * @throws Exception
  2697. * @access private
  2698. */
  2699. private function _nameprep(array $input): array
  2700. {
  2701. $output = [];
  2702. // Walking through the input array, performing the required steps on each of
  2703. // the input chars and putting the result into the output array
  2704. // While mapping required chars we apply the canonical ordering
  2705. foreach ($input as $v) {
  2706. // Map to nothing == skip that code point
  2707. if (in_array($v, self::$_np_map_nothing)) {
  2708. continue;
  2709. }
  2710. // Try to find prohibited input
  2711. if (in_array($v, self::$_np_prohibit) || in_array($v, self::$_general_prohibited)) {
  2712. throw new Net_IDNA2_Exception_Nameprep('Prohibited input U+' . sprintf('%08X', $v));
  2713. }
  2714. foreach (self::$_np_prohibit_ranges as $range) {
  2715. if ($range[0] <= $v && $v <= $range[1]) {
  2716. throw new Net_IDNA2_Exception_Nameprep('Prohibited input U+' . sprintf('%08X', $v));
  2717. }
  2718. }
  2719. // Hangul syllable decomposition
  2720. if (0xAC00 <= $v && $v <= 0xD7AF) {
  2721. foreach ($this->_hangulDecompose($v) as $out) {
  2722. $output[] = $out;
  2723. }
  2724. } elseif (($this->_version == '2003') && isset(self::$_np_replacemaps[$v])) {
  2725. // There's a decomposition mapping for that code point
  2726. // Decompositions only in version 2003 (original) of IDNA
  2727. foreach ($this->_applyCannonicalOrdering(self::$_np_replacemaps[$v]) as $out) {
  2728. $output[] = $out;
  2729. }
  2730. } else {
  2731. $output[] = $v;
  2732. }
  2733. }
  2734. // Combine code points
  2735. $last_class = 0;
  2736. $last_starter = 0;
  2737. $out_len = count($output);
  2738. for ($i = 0; $i < $out_len; ++$i) {
  2739. $class = $this->_getCombiningClass($output[$i]);
  2740. if ((!$last_class || $last_class != $class) && $class) {
  2741. // Try to match
  2742. $seq_len = $i - $last_starter;
  2743. $out = $this->_combine(array_slice($output, $last_starter, $seq_len));
  2744. // On match: Replace the last starter with the composed character and remove
  2745. // the now redundant non-starter(s)
  2746. if ($out) {
  2747. $output[$last_starter] = $out;
  2748. if (count($out) != $seq_len) {
  2749. for ($j = $i + 1; $j < $out_len; ++$j) {
  2750. $output[$j - 1] = $output[$j];
  2751. }
  2752. unset($output[$out_len]);
  2753. }
  2754. // Rewind the for loop by one, since there can be more possible compositions
  2755. $i--;
  2756. $out_len--;
  2757. $last_class = ($i == $last_starter) ? 0 : $this->_getCombiningClass($output[$i - 1]);
  2758. continue;
  2759. }
  2760. }
  2761. // The current class is 0
  2762. if (!$class) {
  2763. $last_starter = $i;
  2764. }
  2765. $last_class = $class;
  2766. }
  2767. return $output;
  2768. }
  2769. /**
  2770. * Decomposes a Hangul syllable
  2771. * (see http://www.unicode.org/unicode/reports/tr15/#Hangul).
  2772. *
  2773. * @param int $char 32bit UCS4 code point
  2774. *
  2775. * @return array Either Hangul Syllable decomposed or original 32bit
  2776. * value as one value array
  2777. * @access private
  2778. */
  2779. private function _hangulDecompose(int $char): array
  2780. {
  2781. $sindex = $char - $this->_sbase;
  2782. if ($sindex < 0 || $sindex >= $this->_scount) {
  2783. return [$char];
  2784. }
  2785. $result = [];
  2786. $T = $this->_tbase + $sindex % $this->_tcount;
  2787. $result[] = (int)($this->_lbase + $sindex / $this->_ncount);
  2788. $result[] = (int)($this->_vbase + ($sindex % $this->_ncount) / $this->_tcount);
  2789. if ($T != $this->_tbase) {
  2790. $result[] = $T;
  2791. }
  2792. return $result;
  2793. }
  2794. /**
  2795. * Ccomposes a Hangul syllable
  2796. * (see http://www.unicode.org/unicode/reports/tr15/#Hangul).
  2797. *
  2798. * @param array $input Decomposed UCS4 sequence
  2799. *
  2800. * @return array UCS4 sequence with syllables composed
  2801. * @access private
  2802. */
  2803. private function _hangulCompose(array $input): array
  2804. {
  2805. $inp_len = count($input);
  2806. if (!$inp_len) {
  2807. return [];
  2808. }
  2809. $result = [];
  2810. $last = $input[0];
  2811. $result[] = $last; // copy first char from input to output
  2812. for ($i = 1; $i < $inp_len; ++$i) {
  2813. $char = $input[$i];
  2814. // Find out, wether two current characters from L and V
  2815. $lindex = $last - $this->_lbase;
  2816. if (0 <= $lindex && $lindex < $this->_lcount) {
  2817. $vindex = $char - $this->_vbase;
  2818. if (0 <= $vindex && $vindex < $this->_vcount) {
  2819. // create syllable of form LV
  2820. $last = ($this->_sbase + ($lindex * $this->_vcount + $vindex) * $this->_tcount);
  2821. $out_off = count($result) - 1;
  2822. $result[$out_off] = $last; // reset last
  2823. // discard char
  2824. continue;
  2825. }
  2826. }
  2827. // Find out, wether two current characters are LV and T
  2828. $sindex = $last - $this->_sbase;
  2829. if (0 <= $sindex && $sindex < $this->_scount && ($sindex % $this->_tcount) == 0) {
  2830. $tindex = $char - $this->_tbase;
  2831. if (0 <= $tindex && $tindex <= $this->_tcount) {
  2832. // create syllable of form LVT
  2833. $last += $tindex;
  2834. $out_off = count($result) - 1;
  2835. $result[$out_off] = $last; // reset last
  2836. // discard char
  2837. continue;
  2838. }
  2839. }
  2840. // if neither case was true, just add the character
  2841. $last = $char;
  2842. $result[] = $char;
  2843. }
  2844. return $result;
  2845. }
  2846. /**
  2847. * Returns the combining class of a certain wide char.
  2848. *
  2849. * @param integer $char Wide char to check (32bit integer)
  2850. *
  2851. * @return int Combining class if found, else 0
  2852. * @access private
  2853. */
  2854. private function _getCombiningClass(int $char): int
  2855. {
  2856. return isset(self::$_np_norm_combcls[$char]) ? self::$_np_norm_combcls[$char] : 0;
  2857. }
  2858. /**
  2859. * Apllies the canonical ordering of a decomposed UCS4 sequence.
  2860. *
  2861. * @param array $input Decomposed UCS4 sequence
  2862. *
  2863. * @return array Ordered USC4 sequence
  2864. * @access private
  2865. */
  2866. private function _applyCannonicalOrdering(array $input): array
  2867. {
  2868. $swap = true;
  2869. $size = count($input);
  2870. while ($swap) {
  2871. $swap = false;
  2872. $last = $this->_getCombiningClass($input[0]);
  2873. for ($i = 0; $i < $size - 1; ++$i) {
  2874. $next = $this->_getCombiningClass($input[$i + 1]);
  2875. if ($next != 0 && $last > $next) {
  2876. // Move item leftward until it fits
  2877. for ($j = $i + 1; $j > 0; --$j) {
  2878. if ($this->_getCombiningClass($input[$j - 1]) <= $next) {
  2879. break;
  2880. }
  2881. $t = $input[$j];
  2882. $input[$j] = $input[$j - 1];
  2883. $input[$j - 1] = $t;
  2884. $swap = 1;
  2885. }
  2886. // Reentering the loop looking at the old character again
  2887. $next = $last;
  2888. }
  2889. $last = $next;
  2890. }
  2891. }
  2892. return $input;
  2893. }
  2894. /**
  2895. * Do composition of a sequence of starter and non-starter.
  2896. *
  2897. * @param array $input UCS4 Decomposed sequence
  2898. *
  2899. * @return array|false Ordered USC4 sequence
  2900. * @access private
  2901. */
  2902. private function _combine($input)
  2903. {
  2904. $inp_len = count($input);
  2905. // Is it a Hangul syllable?
  2906. if (1 != $inp_len) {
  2907. $hangul = $this->_hangulCompose($input);
  2908. // This place is probably wrong
  2909. if (count($hangul) != $inp_len) {
  2910. return $hangul;
  2911. }
  2912. }
  2913. foreach (self::$_np_replacemaps as $np_src => $np_target) {
  2914. if ($np_target[0] != $input[0]) {
  2915. continue;
  2916. }
  2917. if (count($np_target) != $inp_len) {
  2918. continue;
  2919. }
  2920. $hit = false;
  2921. foreach ($input as $k2 => $v2) {
  2922. if ($v2 == $np_target[$k2]) {
  2923. $hit = true;
  2924. } else {
  2925. $hit = false;
  2926. break;
  2927. }
  2928. }
  2929. if ($hit) {
  2930. return $np_src;
  2931. }
  2932. }
  2933. return false;
  2934. }
  2935. /**
  2936. * This converts an UTF-8 encoded string to its UCS-4 (array) representation
  2937. * By talking about UCS-4 we mean arrays of 32bit integers representing
  2938. * each of the "chars". This is due to PHP not being able to handle strings with
  2939. * bit depth different from 8. This applies to the reverse method _ucs4_to_utf8(), too.
  2940. * The following UTF-8 encodings are supported:
  2941. *
  2942. * bytes bits representation
  2943. * 1 7 0xxxxxxx
  2944. * 2 11 110xxxxx 10xxxxxx
  2945. * 3 16 1110xxxx 10xxxxxx 10xxxxxx
  2946. * 4 21 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
  2947. * 5 26 111110xx 10xxxxxx 10xxxxxx 10xxxxxx 10xxxxxx
  2948. * 6 31 1111110x 10xxxxxx 10xxxxxx 10xxxxxx 10xxxxxx 10xxxxxx
  2949. *
  2950. * Each x represents a bit that can be used to store character data.
  2951. *
  2952. * @param string $input utf8-encoded string
  2953. *
  2954. * @return array ucs4-encoded array
  2955. * @throws Exception
  2956. * @access private
  2957. */
  2958. private function _utf8_to_ucs4(string $input): array
  2959. {
  2960. $output = [];
  2961. $out_len = 0;
  2962. $inp_len = self::_byteLength($input, '8bit');
  2963. $mode = 'next';
  2964. $test = 'none';
  2965. for ($k = 0; $k < $inp_len; ++$k) {
  2966. $v = ord($input[$k]); // Extract byte from input string
  2967. if ($v < 128) { // We found an ASCII char - put into string as is
  2968. $output[$out_len] = $v;
  2969. ++$out_len;
  2970. if ('add' == $mode) {
  2971. throw new UnexpectedValueException('Conversion from UTF-8 to UCS-4 failed: malformed input at byte ' . $k);
  2972. }
  2973. continue;
  2974. }
  2975. if ('next' == $mode) { // Try to find the next start byte; determine the width of the Unicode char
  2976. $start_byte = $v;
  2977. $mode = 'add';
  2978. $test = 'range';
  2979. if ($v >> 5 == 6) { // &110xxxxx 10xxxxx
  2980. $next_byte = 0; // Tells, how many times subsequent bitmasks must rotate 6bits to the left
  2981. $v = ($v - 192) << 6;
  2982. } elseif ($v >> 4 == 14) { // &1110xxxx 10xxxxxx 10xxxxxx
  2983. $next_byte = 1;
  2984. $v = ($v - 224) << 12;
  2985. } elseif ($v >> 3 == 30) { // &11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
  2986. $next_byte = 2;
  2987. $v = ($v - 240) << 18;
  2988. } elseif ($v >> 2 == 62) { // &111110xx 10xxxxxx 10xxxxxx 10xxxxxx 10xxxxxx
  2989. $next_byte = 3;
  2990. $v = ($v - 248) << 24;
  2991. } elseif ($v >> 1 == 126) { // &1111110x 10xxxxxx 10xxxxxx 10xxxxxx 10xxxxxx 10xxxxxx
  2992. $next_byte = 4;
  2993. $v = ($v - 252) << 30;
  2994. } else {
  2995. throw new UnexpectedValueException('This might be UTF-8, but I don\'t understand it at byte ' . $k);
  2996. }
  2997. if ('add' == $mode) {
  2998. $output[$out_len] = (int)$v;
  2999. ++$out_len;
  3000. continue;
  3001. }
  3002. }
  3003. if ('add' == $mode) {
  3004. if (!$this->_allow_overlong && $test == 'range') {
  3005. $test = 'none';
  3006. if (($v < 0xA0 && $start_byte == 0xE0) || ($v < 0x90 && $start_byte == 0xF0) || ($v > 0x8F && $start_byte == 0xF4)) {
  3007. throw new OutOfRangeException('Bogus UTF-8 character detected (out of legal range) at byte ' . $k);
  3008. }
  3009. }
  3010. if ($v >> 6 == 2) { // Bit mask must be 10xxxxxx
  3011. $v = ($v - 128) << ($next_byte * 6);
  3012. $output[($out_len - 1)] += $v;
  3013. --$next_byte;
  3014. } else {
  3015. throw new UnexpectedValueException('Conversion from UTF-8 to UCS-4 failed: malformed input at byte ' . $k);
  3016. }
  3017. if ($next_byte < 0) {
  3018. $mode = 'next';
  3019. }
  3020. }
  3021. } // for
  3022. return $output;
  3023. }
  3024. /**
  3025. * Convert UCS-4 array into UTF-8 string
  3026. *
  3027. * @param array $input ucs4-encoded array
  3028. *
  3029. * @return string utf8-encoded string
  3030. * @throws Exception
  3031. * @access private
  3032. */
  3033. private function _ucs4_to_utf8(array $input): string
  3034. {
  3035. $output = '';
  3036. foreach ($input as $v) {
  3037. // $v = ord($v);
  3038. if ($v < 128) {
  3039. // 7bit are transferred literally
  3040. $output .= chr($v);
  3041. } elseif ($v < 1 << 11) {
  3042. // 2 bytes
  3043. $output .= chr(192 + ($v >> 6))
  3044. . chr(128 + ($v & 63));
  3045. } elseif ($v < 1 << 16) {
  3046. // 3 bytes
  3047. $output .= chr(224 + ($v >> 12))
  3048. . chr(128 + (($v >> 6) & 63))
  3049. . chr(128 + ($v & 63));
  3050. } elseif ($v < 1 << 21) {
  3051. // 4 bytes
  3052. $output .= chr(240 + ($v >> 18))
  3053. . chr(128 + (($v >> 12) & 63))
  3054. . chr(128 + (($v >> 6) & 63))
  3055. . chr(128 + ($v & 63));
  3056. } elseif ($v < 1 << 26) {
  3057. // 5 bytes
  3058. $output .= chr(248 + ($v >> 24))
  3059. . chr(128 + (($v >> 18) & 63))
  3060. . chr(128 + (($v >> 12) & 63))
  3061. . chr(128 + (($v >> 6) & 63))
  3062. . chr(128 + ($v & 63));
  3063. } elseif ($v < 1 << 31) {
  3064. // 6 bytes
  3065. $output .= chr(252 + ($v >> 30))
  3066. . chr(128 + (($v >> 24) & 63))
  3067. . chr(128 + (($v >> 18) & 63))
  3068. . chr(128 + (($v >> 12) & 63))
  3069. . chr(128 + (($v >> 6) & 63))
  3070. . chr(128 + ($v & 63));
  3071. } else {
  3072. throw new UnexpectedValueException('Conversion from UCS-4 to UTF-8 failed: malformed input');
  3073. }
  3074. }
  3075. return $output;
  3076. }
  3077. /**
  3078. * Convert UCS-4 array into UCS-4 string
  3079. *
  3080. * @param array $input ucs4-encoded array
  3081. *
  3082. * @return string ucs4-encoded string
  3083. * @throws Exception
  3084. * @access private
  3085. */
  3086. private function _ucs4_to_ucs4_string(array $input): string
  3087. {
  3088. $output = '';
  3089. // Take array values and split output to 4 bytes per value
  3090. // The bit mask is 255, which reads &11111111
  3091. foreach ($input as $v) {
  3092. $output .= ($v & (255 << 24) >> 24) . ($v & (255 << 16) >> 16) . ($v & (255 << 8) >> 8) . ($v & 255);
  3093. }
  3094. return $output;
  3095. }
  3096. /**
  3097. * Convert UCS-4 string into UCS-4 array
  3098. *
  3099. * @param string $input ucs4-encoded string
  3100. *
  3101. * @return array ucs4-encoded array
  3102. * @throws InvalidArgumentException
  3103. * @access private
  3104. */
  3105. private function _ucs4_string_to_ucs4(string $input): array
  3106. {
  3107. $output = [];
  3108. $inp_len = self::_byteLength($input);
  3109. // Input length must be dividable by 4
  3110. if ($inp_len % 4) {
  3111. throw new InvalidArgumentException('Input UCS4 string is broken');
  3112. }
  3113. // Empty input - return empty output
  3114. if (!$inp_len) {
  3115. return $output;
  3116. }
  3117. for ($i = 0, $out_len = -1; $i < $inp_len; ++$i) {
  3118. // Increment output position every 4 input bytes
  3119. if (!$i % 4) {
  3120. $out_len++;
  3121. $output[$out_len] = 0;
  3122. }
  3123. $output[$out_len] += ord($input[$i]) << (8 * (3 - ($i % 4)));
  3124. }
  3125. return $output;
  3126. }
  3127. /**
  3128. * Echo hex representation of UCS4 sequence.
  3129. *
  3130. * @param array $input UCS4 sequence
  3131. * @param bool $include_bit Include bitmask in output
  3132. *
  3133. * @return void
  3134. * @static
  3135. * @access private
  3136. */
  3137. private static function _showHex(array $input, bool $include_bit = false): void
  3138. {
  3139. foreach ($input as $k => $v) {
  3140. echo '[', $k, '] => ', sprintf('%X', $v);
  3141. if ($include_bit) {
  3142. echo ' (', Net_IDNA2::_showBitmask($v), ')';
  3143. }
  3144. echo "\n";
  3145. }
  3146. }
  3147. /**
  3148. * Gives you a bit representation of given Byte (8 bits), Word (16 bits) or DWord (32 bits)
  3149. * Output width is automagically determined
  3150. *
  3151. * @param int $octet ...
  3152. *
  3153. * @return string Bitmask-representation
  3154. * @static
  3155. * @access private
  3156. */
  3157. private static function _showBitmask(int $octet): string
  3158. {
  3159. if ($octet >= (1 << 16)) {
  3160. $w = 31;
  3161. } elseif ($octet >= (1 << 8)) {
  3162. $w = 15;
  3163. } else {
  3164. $w = 7;
  3165. }
  3166. $return = '';
  3167. for ($i = $w; $i > -1; $i--) {
  3168. $return .= ($octet & (1 << $i)) ? '1' : '0';
  3169. }
  3170. return $return;
  3171. }
  3172. /**
  3173. * Gets the length of a string in bytes even if mbstring function
  3174. * overloading is turned on
  3175. *
  3176. * @param string $string the string for which to get the length.
  3177. * @param string $encoding [optional] &mbstring.encoding.parameter;
  3178. *
  3179. * @return int the length of the string in bytes.
  3180. *
  3181. * @see Net_IDNA2::$_mb_string_overload
  3182. */
  3183. private static function _byteLength(string $string, string $encoding = '8bit'): int
  3184. {
  3185. if (self::$_mb_string_overload) {
  3186. return mb_strlen($string, $encoding);
  3187. }
  3188. return strlen((binary)$string);
  3189. }
  3190. // }}}}
  3191. // {{{ factory
  3192. /**
  3193. * Attempts to return a concrete IDNA instance for either php4 or php5.
  3194. *
  3195. * @param array $params Set of paramaters
  3196. *
  3197. * @return Net_IDNA2
  3198. * @access public
  3199. */
  3200. public static function getInstance(array $params = []): Net_IDNA2
  3201. {
  3202. return new Net_IDNA2($params);
  3203. }
  3204. // }}}
  3205. // {{{ singleton
  3206. /**
  3207. * Attempts to return a concrete IDNA instance for either php4 or php5,
  3208. * only creating a new instance if no IDNA instance with the same
  3209. * parameters currently exists.
  3210. *
  3211. * @param array $params Set of parameters
  3212. *
  3213. * @return Net_IDNA2
  3214. * @access public
  3215. */
  3216. public static function singleton(array $params = []): Net_IDNA2
  3217. {
  3218. static $instances;
  3219. if (!isset($instances)) {
  3220. $instances = [];
  3221. }
  3222. $signature = serialize($params);
  3223. if (!isset($instances[$signature])) {
  3224. $instances[$signature] = Net_IDNA2::getInstance($params);
  3225. }
  3226. return $instances[$signature];
  3227. }
  3228. // }}}
  3229. }