// index-xnf.mjs (51 KB)
  // created 2023-09-25T01:01:55.148Z
  // compressed base64-encoded blob for include-ens data
  // source: https://github.com/adraffy/ens-normalize.js/blob/main/src/make.js
  // see: https://github.com/adraffy/ens-normalize.js#security
  // SHA-256: 0565ed049b9cf1614bb9e11ba7d8ac6a6fb96c893253d890f7e2b2884b9ded32
  6. var COMPRESSED = 'AEEUdwmgDS8BxQKKAP4BOgDjATAAngDUAIMAoABoAOAAagCOAEQAhABMAHIAOwA9ACsANgAmAGIAHgAuACgAJwAXAC0AGgAjAB8ALwAUACkAEgAeAAkAGwARABkAFgA5ACgALQArADcAFQApABAAHgAiABAAGgAeABMAGAUhBe8BFxREN8sF2wC5AK5HAW8ArQkDzQCuhzc3NzcBP68NEfMABQdHBuw5BV8FYAA9MzkI9r4ZBg7QyQAWA9CeOwLNCjcCjqkChuA/lm+RAsXTAoP6ASfnEQDytQFJAjWVCkeXAOsA6godAB/cwdAUE0WlBCN/AQUCQRjFD/MRBjHxDQSJbw0jBzUAswBxme+tnIcAYwabAysG8QAjAEMMmxcDqgPKQyDXCMMxA7kUQwD3NXOrAKmFIAAfBC0D3x4BJQDBGdUFAhEgVD8JnwmQJiNWYUzrg0oAGwAUAB0AFnNcACkAFgBP9h3gPfsDOWDKneY2ChglX1UDYD30ABsAFAAdABZzIGRAnwDD8wAjAEEMzRbDqgMB2sAFYwXqAtCnAsS4AwpUJKRtFHsadUz9AMMVbwLpABM1NJEX0ZkCgYMBEyMAxRVvAukAEzUBUFAtmUwSAy4DBTER33EftQHfSwB5MxJ/AjkWKQLzL8E/cwBB6QH9LQDPDtO9ASNriQC5DQANAwCK21EFI91zHwCoL9kBqQcHBwcHKzUDowBvAQohPvU3fAQgHwCyAc8CKQMA5zMSezr7ULgFmDp/LzVQBgEGAi8FYQVgt8AFcTtlQhpCWEmfe5tmZ6IAExsDzQ8t+X8rBKtTAltbAn0jsy8Bl6utPWMDTR8Ei2kRANkDBrNHNysDBzECQWUAcwFpJ3kAiyUhAJ0BUb8AL3EfAbfNAz81KUsFWwF3YQZtAm0A+VEfAzEJDQBRSQCzAQBlAHsAM70GD/v3IZWHBwARKQAxALsjTwHZAeMPEzmXgIHwABIAGQA8AEUAQDt3gdvIEGcQZAkGTRFMdEIVEwK0D64L7REdDNkq09PgADSxB/MDWwfzA1sDWwfzB/MDWwfzA1sDWwNbA1scEvAi28gQZw9QBHUFlgWTBN4IiyZREYkHMAjaVBV0JhxPA00BBCMtSSQ7mzMTJUpMFE0LCAQ2SmyvfUADTzGzVP2QqgPTMlc5dAkGHnkSqAAyD3skNb1OhnpPcagKU0+2tYdJak5vAsY6sEAACikJm2/Dd1YGRRAfJ6kQ+ww3AbkBPw3xS9wE9QY/BM0fgRkdD9GVoAipLeEM8SbnLqWAXiP5KocF8Uv4POELUVFsD10LaQnnOmeBUgMlAREijwrhDT0IcRD3Cs1vDekRSQc9A9lJngCpBwULFR05FbkmFGKwCw05ewb/GvoLkyazEy17AAXXGiUGUQEtGwMA0y7rhbRaNVwgT2MGBwspI8sUrFAkDSlAu3hMGh8HGSWtApVDdEqLUToelyH6PEENai4XUYAH+TwJGVMLhTyiRq9FEhHWPpE9TCJNTDAEOYMsMyePCdMPiQy9fHYBXQklCbUMdRM1ERs3yQg9Bx0xlygnGQglRplgngT7owP3E9UDDwVDCUUHFwO5HDETMhUtBRGBKNsC9zbZLrcCk1aEARsFzw8pH+MQVEfkDu0InwJpA4cl7wAxFSUAGyKfCEdnAGOP3FMJLs8Iy2pwI3gDaxTrZRF3B5UOWwerHDcVwxzlcMxeD4YMKKezCV8BeQmdAWME5wgNNV+MpCBFZ1eLXBifIGVBQ14AAjUMaRWjRMGHfAKPD28SHwE5AXcHPQ0FAnsR8RFvEJkI74YINbkz/DopBFMhhyAVCisDU2zSCysm/Qz8bQGnEmYDEDRBd/Jnr2C6KBgBBx0yyUFkIfULlk/RDKAaxRhGVDIZ6AfDA/ca9yfuQVsGAwOnBxc6UTPyBMELbQiPCUMATQ6nGwfbGG4KdYzUATWPAbudA1uVhwJzkwY7Bw8Aaw+LB
X3pACECqwinAAkA0wNbAD0CsQehAB0AiUUBQQMrMwEl6QKTA5cINc8BmTMB9y0EH8cMGQD7O25OAsO1AoBuZqYF4VwCkgJNOQFRKQQJUktVA7N15QDfAE8GF+NLARmvTs8e50cB43MvAMsA/wAJOQcJRQHRAfdxALsBYws1Caa3uQFR7S0AhwAZbwHbAo0A4QA5AIP1AVcAUQVd/QXXAlNNARU1HC9bZQG/AyMBNwERAH0Gz5GpzQsjBHEH1wIQHxXlAu8yB7kFAyLjE9FCyQK94lkAMhoKPAqrCqpgX2Q3CjV2PVQAEh+sPss/UgVVO1c7XDtXO1w7VztcO1c7XDtXO1wDm8Pmw+YKcF9JYe8Mqg3YRMw6TRPfYFVgNhPMLbsUxRXSJVoZQRrAJwkl6FUNDwgt12Y0CDA0eRfAAEMpbINFY4oeNApPHOtTlVT8LR8AtUumM7MNsBsZREQFS3XxYi4WEgomAmSFAmJGX1GzAV83JAKh+wJonAJmDQKfiDgfDwJmPwJmKgRyBIMDfxcDfpY5Cjl7GzmGOicnAmwhAjI6OA4CbcsCbbLzjgM3a0kvAWsA4gDlAE4JB5wMkQECD8YAEbkCdzMCdqZDAnlPRwJ4viFg30WyRvcCfEMCeswCfQ0CfPRIBEiBZygALxlJXEpfGRtK0ALRBQLQ0EsrA4hTA4fqRMmRNgLypV0HAwOyS9JMMSkH001QTbMCi0MCitzFHwshR2sJuwKOOwKOYESbhQKO3QKOYHxRuFM5AQ5S2FSJApP/ApMQAO0AIFUiVbNV1AosHymZijLleGpFPz0Cl6MC77ZYJawAXSkClpMCloCgAK1ZsFoNhVEAPwKWuQKWUlxIXNUCmc8CmWhczl0LHQKcnznGOqECnBoCn58CnryOACETNS4TAp31Ap6WALlBYThh8wKe1wKgcgGtAp6jIwKeUqljzGQrKS8CJ7MCJoICoP8CoFDbAqYzAqXSAqgDAIECp/ZogGi1AAdNaiBq1QKs5wKssgKtawKtBgJXIQJV4AKx5dsDH1JsmwKywRECsuwbbORtZ21MYwMl0QK2YD9DbpQDKUkCuGICuUsZArkue3A6cOUCvR0DLbYDMhUCvoxyBgMzdQK+HnMmc1MCw88CwwhzhnRPOUl05AM8qwEDPJ4DPcMCxYACxksCxhSNAshtVQLISALJUwLJMgJkoQLd1nh9ZXiyeSlL1AMYp2cGAmH4GfeVKHsPXpZevxUCz28Cz3AzT1fW9xejAMqxAs93AS3uA04Wfk8JAtwrAtuOAtJTA1JgA1NjAQUDVZCAjUMEzxrxZEl5A4LSg5EC2ssC2eKEFIRNp0ADhqkAMwNkEoZ1Xf0AWQLfaQLevHd7AuIz7RgB8zQrAfSfAfLWiwLr9wLpdH0DAur9AuroAP1LAb0C7o0C66CWrpcHAu5DA4XkmH1w5HGlAvMHAG0DjhqZlwL3FwORcgOSiwL3nAL53QL4apogmq+/O5siA52HAv7+AR8APZ8gAZ+3AwWRA6ZuA6bdANXJAwZuoYyiCQ0DDE0BEwEjB3EGZb1rCQC/BG/DFY8etxEAG3k9ACcDNxJRA42DAWcrJQCM8wAlAOanC6OVCLsGI6fJBgCvBRnDBvElRUYFFoAFcD9GSDNCKUK8X3kZX8QAls0FOgCQVCGbwTsuYDoZutcONxjOGJHJ/gVfBWAFXwVgBWsFYAVfBWAFXwVgBV8FYAVfBWBOHQjfjW8KCgoKbF7xMwTRA7kGN8PDAMMEr8MA70gxFroFTj5xPnhCR0K+X30/X/AAWBkzswCNBsxzzASm70aCRS4rDDMeLz49fnXfcsH5GcoscQFz13Y4HwVnBXLJycnACNdRYwgICAqEXoWTxgA7P4kACxbZBu21Kw0AjMsTAwkVAOVtJUUsJ1JCuULESUArXy9gPi9AKwnJRQYKTD9LPoA+iT54PnkCkULEUUpDX9NWV3JVEjQAc1w3A3IBE3YnX+g7QiMJb6MKa
iszRCUuQrNCxDPMCcwEX9EWJzYREBEEBwIHKn6l33JCNVIfybPJtAltydPUCmhBZw/tEKsZAJOVJU1CLRuxbUHOQAo7P0s+eEJHHA8SJVRPdGM0NVrpvBoKhfUlM0JHHGUQUhEWO1xLSj8MO0ucNAqJIzVCRxv9EFsqKyA4OQgNj2nwZgp5ZNFgE2A1K3YHS2AhQQojJmC7DgpzGG1WYFUZCQYHZO9gHWCdYIVgu2BTYJlwFh8GvRbcXbG8YgtDHrMBwzPVyQonHQgkCyYBgQJ0Ajc4nVqIAwGSCsBPIgDsK3SWEtIVBa5N8gGjAo+kVwVIZwD/AEUSCDweX4ITrRQsJ8K3TwBXFDwEAB0TvzVcAtoTS20RIwDgVgZ9BBImYgA5AL4Coi8LFnezOkCnIQFjAY4KBAPh9RcGsgZSBsEAJctdsWIRu2kTkQstRw7DAcMBKgpPBGIGMDAwKCYnKTQaLg4AKRSVAFwCdl+YUZ0JdicFD3lPAdt1F9ZZKCGxuE3yBxkFVGcA/wBFEgiCBwAOLHQSjxOtQDg1z7deFRMAZ8QTAGtKb1ApIiPHADkAvgKiLy1DFtYCmBiDAlDDWNB0eo7fpaMO/aEVRRv0ATEQZBIODyMEAc8JQhCbDRgzFD4TAEMAu9YBCgCsAOkAm5I3ABwAYxvONnR+MhXJAxgKQyxL2+kkJhMbhQKDBMkSsvF0AD9BNQ6uQC7WqSQHwxEAEEIu1hkhAH2z4iQPwyJPHNWpdyYBRSpnJALzoBAEVPPsH20MxA0CCEQKRgAFyAtFAlMNwwjEDUQJRArELtapMg7DDZgJIw+TGukEIwvDFkMAqAtDEMMMBhioe+QAO3MMRAACrgnEBSPY9Q0FDnbSBoMAB8MSYxkSxAEJAPIJAAB8FWMOFtMc/HcXwxhDAC7DAvOowwAewwJdKDKHAAHDAALrFUQVwwAbwyvzpWMWv8wA/ABpAy++bcYDUKPD0KhDCwKmJ1MAAmMA5+UZwxAagwipBRL/eADfw6fDGOMCGsOjk3l6BwOpo4sAEsMOGxMAA5sAbcMOAAvDp0MJGkMDwgipnNIPAwfIqUMGAOGDAAPzABXDAAcDAAnDAGmTABrDAA7DChjDjnEWAwABYwAOcwAuUyYABsMAF8MIKQANUgC6wy4AA8MADqMq8wCyYgAcIwAB8wqpAAXOCx0V4wAHowBCwwEKAGnDAAuDAB3DAAjDCakABdIAbqcZ3QCZCCkABdIAAAFDAAfjAB2jCCkABqIACYMAGzMAbSMA5sOIAAhjAAhDABTDBAkpAAbSAOOTAAlDC6kOzPtnAAdDAG6kQFAATwAKwwwAA0MACbUDPwAHIwAZgwACE6cDAAojAApDAAoDp/MGwwAJIwADEwAQQwgAFEMAEXMAD5MADfMADcMAGRMOFiMAFUMAbqMWuwHDAMIAE0MLAGkzEgDhUwACQwAEWgAXgwUjAAbYABjDBSYBgzBaAEFNALcQBxUMegAwMngBrA0IZgJ0KxQHBREPd1N0ZzKRJwaIHAZqNT4DqQq8BwngAB4DAwt2AX56T1ocKQNXAh1GATQGC3tOxYNagkgAMQA5CQADAQEAWxLjAIOYNAEzAH7tFRk6TglSAF8NAAlYAQ+S1ACAQwQorQBiAN4dAJ1wPyeTANVzuQDX3AIeEMp9eyMgXiUAEdkBkJizKltbVVAaRMqRAAEAhyQ/SDEz6BmfVwB6ATEsOClKIRcDOF0E/832AFNt5AByAnkCRxGCOs94NjXdAwINGBonDBwPALW2AwICAgAAAAAAAAYDBQMDARrUAwAtAAAAAgEGBgYGBgYFBQUFBQUEBQYHCAkEBQUFBQQAAAICAAAAIgCNAJAAlT0A6gC7ANwApEQAwgCyAK0AqADuAKYA2gCjAOcBCAEDAMcAgQBiANIA1AEDAN4A8gCQAKkBMQDqAN8A3AsBCQ8yO9ra2tq8xuLT1tRJOB0BUgFcNU0BWgFpAWgBWwFMUUlLbhMBU
xsNEAs6PhMOACcUKy0vMj5AQENDQ0RFFEYGJFdXV1dZWVhZL1pbXVxcI2NnZ2ZoZypsbnZ1eHh4eHh4enp6enp6enp6enp8fH18e2IARPIASQCaAHgAMgBm+ACOAFcAVwA3AnbvAIsABfj4AGQAk/IAnwBPAGIAZP//sACFAIUAaQBWALEAJAC2AIMCQAJDAPwA5wD+AP4A6AD/AOkA6QDoAOYALwJ7AVEBQAE+AVQBPgE+AT4BOQE4ATgBOAEcAVgXADEQCAEAUx8SHgsdHhYAjgCWAKYAUQBqIAIxAHYAbwCXAxUDJzIDIUlGTzEAkQJPAMcCVwKkAMAClgKWApYClgKWApYCiwKWApYClgKWApYClgKVApUCmAKgApcClgKWApQClAKUApQCkgKVAnUB1AKXAp8ClgKWApUeAIETBQD+DQOfAmECOh8BVBg9AuIZEjMbAU4/G1WZAXusRAFpYQEFA0FPAQYAmTEeIJdyADFoAHEANgCRA5zMk/C2jGINwjMWygIZCaXdfDILBCs5dAE7YnQBugDlhoiHhoiGiYqKhouOjIaNkI6Ij4qQipGGkoaThpSSlYaWhpeKmIaZhpqGm4aci52QnoqfhuIC4XTpAt90AIp0LHSoAIsAdHQEQwRABEIERQRDBEkERgRBBEcESQRIBEQERgRJAJ5udACrA490ALxuAQ10ANFZdHQA13QCFHQA/mJ0AP4BIQD+APwA/AD9APwDhGZ03ASMK23HAP4A/AD8AP0A/CR0dACRYnQA/gCRASEA/gCRAvQA/gCRA4RmdNwEjCttxyR0AP9idAEhAP4A/gD8APwA/QD8AP8A/AD8AP0A/AOEZnTcBIwrbcckdHQAkWJ0ASEA/gCRAP4AkQL0AP4AkQOEZnTcBIwrbcckdAJLAT50AlIBQXQCU8l0dAJfdHQDpgL0A6YDpgOnA6cDpwOnA4RmdNwEjCttxyR0dACRYnQBIQOmAJEDpgCRAvQDpgCRA4RmdNwEjCttxyR0BDh0AJEEOQCRDpU5dSgCADR03gV2CwArdAEFAM5iCnR0AF1iAAYcOgp0dACRCnQAXAEIwWZ0CnRmdHQAkWZ0CnRmdEXgAFF03gp0dEY0tlT2u3SOAQTwscwhjZZKrhYcBSfFp9XNbKiVDOD2b+cpe4/Z17mQnbtzzhaeQtE2GGj0IDNTjRUSyTxxw/RPHW/+vS7d1NfRt9z9QPZg4X7QFfhCnkvgNPIItOsC2eV6hPannZNHlZ9xrwZXIMOlu3jSoQSq78WEjwLjw1ELSlF1aBvfzwk5ZX7AUvQzjPQKbDuQ+sm4wNOp4A6AdVuRS0t1y/DZpg4R6m7FNjM9HgvW7Bi88zaMjOo6lM8wtBBdj8LP4ylv3zCXPhebMKJc066o9sF71oFW/8JXu86HJbwDID5lzw5GWLR/LhT0Qqnp2JQxNZNfcbLIzPy+YypqRm/lBmGmex+82+PisxUumSeJkALIT6rJezxMH+CTJmQtt5uwTVbL3ptmjDUQzlSIvWi8Tl7ng1NpuRn1Ng4n14Qc+3Iil7OwkvNWogLSPkn3pihIFytyIGmMhOe3n1tWsuMy9BdKyqF4Z3v2SgggTL9KVvMXPnCbRe+oOuFFP3HejBG/w9gvmfNYvg6JuWia2lcSSN1uIjBktzoIazOHPJZ7kKHPz8mRWVdW3lA8WGF9dQF6Bm673boov3BUWDU2JNcahR23GtfHKLOz/viZ+rYnZFaIznXO67CYEJ1fXuTRpZhYZkKe54xeoagkNGLs+NTZHE0rX45/XvQ2RGADX6vcAvdxIUBV27wxGm2zjZo4X3ILgAlrOFheuZ6wtsvaIj4yLY7qqawlliaIcrz2G+c3vscAnCkCuMzMmZvMfu9lLwTvfX+3cVSyPdN9ZwgDZhfjRgNJcLiJ67b9xx8JHswprbiE3v9UphotAPIgnXVIN5KmMc0piXhc6cChPnN+MRhG9adtdttQTTwSIpl8I4/j//d3s
z1326qTBTpPRM/Hgh3kzqEXs8ZAk4ErQhNO8hzrQ0DLkWMA/N+91tn2MdOJnWC2FCZehkQrwzwbKOjhvZsbM95QoeL9skYyMf4srVPVJSgg7pOLUtr/n9eT99oe9nLtFRpjA9okV2Kj8h9k5HaC0oivRD8VyXkJ81tcd4fHNXPCfloIQasxsuO18/46dR2jgul/UIet2G0kRvnyONMKhHs6J26FEoqSqd+rfYjeEGwHWVDpX1fh1jBBcKGMqRepju9Y00mDVHC+Xdij/j44rKfvfjGinNs1jO/0F3jB83XCDINN/HB84axlP+3E/klktRo+vl3U/aiyMJbIodE1XSsDn6UAzIoMtUObY2+k/4gY/l+AkZJ5Sj2vQrkyLm3FoxjhDX+31UXBFf9XrAH31fFqoBmDEZvhvvpnZ87N+oZEu7U9O/nnk+QWj3x8uyoRbEnf+O5UMr9i0nHP38IF5AvzrBW8YWBUR0mIAzIvndQq9N3v/Jto3aPjPXUPl8ASdPPyAp7jENf8bk7VMM9ol9XGmlBmeDMuGqt+WzuL6CXAxXjIhCPM5vACchgMJ/8XBGLO/D1isVvGhwwHHr1DLaI5mn2Jr/b1pUD90uciDaS8cXNDzCWvNmT/PhQe5e8nTnnnkt8Ds/SIjibcum/fqDhKopxAY8AkSrPn+IGDEKOO+U3XOP6djFs2H5N9+orhOahiQk5KnEUWa+CzkVzhp8bMHRbg81qhjjXuIKbHjSLSIBKWqockGtKinY+z4/RdBUF6pcc3JmnlxVcNgrI4SEzKUZSwcD2QCyxzKve+gAmg6ZuSRkpPFa6mfThu7LJNu3H5K42uCpNvPAsoedolKV/LHe/eJ+BbaG5MG0NaSGVPRUmNFMFFSSpXEcXwbVh7UETOZZtoVNRGOIbbkig3McEtR68cG0RZAoJevWYo7Dg/lZ1CQzblWeUvVHmr8fY4Nqd9JJiH/zEX24mJviH60fAyFr0A3c4bC1j3yZU60VgJxXn8JgJXLUIsiBnmKmMYz+7yBQFBvqb2eYnuW59joZBf56/wXvWIR4R8wTmV80i1mZy+S4+BUES+hzjk0uXpC///z/IlqHZ1monzlXp8aCfhGKMti73FI1KbL1q6IKO4fuBuZ59gagjn5xU79muMpHXg6S+e+gDM/U9BKLHbl9l6o8czQKl4RUkJJiqftQG2i3BMg/TQlUYFkJDYBOOvAugYuzYSDnZbDDd/aSd9x0Oe6F+bJcHfl9+gp6L5/TgA+BdFFovbfCrQ40s5vMPw8866pNX8zyFGeFWdxIpPVp9Rg1UPOVFbFZrvaFq/YAzHQgqMWpahMYfqHpmwXfHL1/kpYmGuHFwT55mQu0dylfNuq2Oq0hTMCPwqfxnuBIPLXfci4Y1ANy+1CUipQxld/izVh16WyG2Q0CQQ9NqtAnx1HCHwDj7sYxOSB0wopZSnOzxQOcExmxrVTF2BkOthVpGfuhaGECfCJpJKpjnihY+xOT2QJxN61+9K6QSqtv2Shr82I3jgJrqBg0wELFZPjvHpvzTtaJnLK6Vb97Yn933koO/saN7fsjwNKzp4l2lJVx2orjCGzC/4ZL4zCver6aQYtC5sdoychuFE6ufOiog+VWi5UDkbmvmtah/3aArEBIi39s5ILUnlFLgilcGuz9CQshEY7fw2ouoILAYPVT/gyAIq3TFAIwVsl+ktkRz/qGfnCDGrm5gsl/l9QdvCWGsjPz3dU7XuqKfdUrr/6XIgjp4rey6AJBmCmUJMjITHVdFb5m1p+dLMCL8t55zD42cmftmLEJC0Da04YiRCVUBLLa8D071/N5UBNBXDh0LFsmhV/5B5ExOB4j3WVG/S3lfK5o+V6ELHvy6RR9n4ac+VsK4VE4yphPvV+kG9FegTBH4ZRXL2HytUHCduJazB/KykjfetYxOXTLws267aGOd+I+JhKP//+VnXmS90OD/jvLcVu0asyqcuYN1mSb6XTlCkqv1vigZPIYwNF
/zpWcT1GR/6aEIRjkh0yhg4LXJfaGobYJTY4JI58KiAKgmmgAKWdl5nYCeLqavRJGQNuYuZtZFGx+IkI4w4NS2xwbetNMunOjBu/hmKCI/w7tfiiyUd//4rbTeWt4izBY8YvGIN6vyKYmP/8X8wHKCeN+WRcKM70+tXKNGyevU9H2Dg5BsljnTf8YbsJ1TmMs74Ce2XlHisleguhyeg44rQOHZuw/6HTkhnnurK2d62q6yS7210SsAIaR+jXMQA+svkrLpsUY+F30Uw89uOdGAR6vo4FIME0EfVVeHTu6eKicfhSqOeXJhbftcd08sWEnNUL1C9fnprTgd83IMut8onVUF0hvqzZfHduPjbjwEXIcoYmy+P6tcJZHmeOv6VrvEdkHDJecjHuHeWANe79VG662qTjA/HCvumVv3qL+LrOcpqGps2ZGwQdFJ7PU4iuyRlBrwfO+xnPyr47s2cXVbWzAyznDiBGjCM3ksxjjqM62GE9C8f5U38kB3VjtabKp/nRdvMESPGDG90bWRLAt1Qk5DyLuazRR1YzdC1c+hZXvAWV8xA72S4A8B67vjVhbba3MMop293FeEXpe7zItMWrJG/LOH9ByOXmYnNJfjmfuX9KbrpgLOba4nZ+fl8Gbdv/ihv+6wFGKHCYrVwmhFC0J3V2bn2tIB1wCc1CST3d3X2OyxhguXcs4sm679UngzofuSeBewMFJboIQHbUh/m2JhW2hG9DIvG2t7yZIzKBTz9wBtnNC+2pCRYhSIuQ1j8xsz5VvqnyUIthvuoyyu7fNIrg/KQUVmGQaqkqZk/Vx5b33/gsEs8yX7SC1J+NV4icz6bvIE7C5G6McBaI8rVg56q5QBJWxn/87Q1sPK4+sQa8fLU5gXo4paaq4cOcQ4wR0VBHPGjKh+UlPCbA1nLXyEUX45qZ8J7/Ln4FPJE2TdzD0Z8MLSNQiykMMmSyOCiFfy84Rq60emYB2vD09KjYwsoIpeDcBDTElBbXxND72yhd9pC/1CMid/5HUMvAL27OtcIJDzNKpRPNqPOpyt2aPGz9QWIs9hQ9LiX5s8m9hjTUu/f7MyIatjjd+tSfQ3ufZxPpmJhTaBtZtKLUcfOCUqADuO+QoH8B9v6U+P0HV1GLQmtoNFTb3s74ivZgjES0qfK+8RdGgBbcCMSy8eBvh98+et1KIFqSe1KQPyXULBMTsIYnysIwiZBJYdI20vseV+wuJkcqGemehKjaAb9L57xZm3g2zX0bZ2xk/fU+bCo7TlnbW7JuF1YdURo/2Gw7VclDG1W7LOtas2LX4upifZ/23rzpsnY/ALfRgrcWP5hYmV9VxVOQA1fZvp9F2UNU+7d7xRyVm5wiLp3/0dlV7vdw1PMiZrbDAYzIVqEjRY2YU03sJhPnlwIPcZUG5ltL6S8XCxU1eYS5cjr34veBmXAvy7yN4ZjArIG0dfD/5UpBNlX1ZPoxJOwyqRi3wQWtOzd4oNKh0LkoTm8cwqgIfKhqqGOhwo71I+zXnMemTv2B2AUzABWyFztGgGULjDDzWYwJUVBTjKCn5K2QGMK1CQT7SzziOjo+BhAmqBjzuc3xYym2eedGeOIRJVyTwDw37iCMe4g5Vbnsb5ZBdxOAnMT7HU4DHpxWGuQ7GeiY30Cpbvzss55+5Km1YsbD5ea3NI9QNYIXol5apgSu9dZ8f8xS5dtHpido5BclDuLWY4lhik0tbJa07yJhH0BOyEut/GRbYTS6RfiTYWGMCkNpfSHi7HvdiTglEVHKZXaVhezH4kkXiIvKopYAlPusftpE4a5IZwvw1x/eLvoDIh/zpo9FiQInsTb2SAkKHV42XYBjpJDg4374XiVb3ws4qM0s9eSQ5HzsMU4OZJKuopFjBM+dAZEl8RUMx5uU2N486Kr141tVsGQfGjORYMCJAMsxELeNT4RmWjRcpdTGBwcx6XN9drWqPmJzcrGrH4+DRc7+n1w3kPZwu0BkNr6hQrqgo7JTB9A5kdJ/
H7P4cWBMwsmuixAzJB3yrQpnGIq90lxAXLzDCdn1LPibsRt7rHNjgQBklRgPZ8vTbjXdgXrTWQsK5MdrXXQVPp0Rinq3frzZKJ0qD6Qhc40VzAraUXlob1gvkhK3vpmHgI6FRlQZNx6eRqkp0zy4AQlX813fAPtL3jMRaitGFFjo0zmErloC+h+YYdVQ6k4F/epxAoF0BmqEoKNTt6j4vQZNQ2BoqF9Vj53TOIoNmDiu9Xp15RkIgQIGcoLpfoIbenzpGUAtqFJp5W+LLnx38jHeECTJ/navKY1NWfN0sY1T8/pB8kIH3DU3DX+u6W3YwpypBMYOhbSxGjq84RZ84fWJow8pyHqn4S/9J15EcCMsXqrfwyd9mhiu3+rEo9pPpoJkdZqHjra4NvzFwuThNKy6hao/SlLw3ZADUcUp3w3SRVfW2rhl80zOgTYnKE0Hs2qp1J6H3xqPqIkvUDRMFDYyRbsFI3M9MEyovPk8rlw7/0a81cDVLmBsR2ze2pBuKb23fbeZC0uXoIvDppfTwIDxk1Oq2dGesGc+oJXWJLGkOha3CX+DUnzgAp9HGH9RsPZN63Hn4RMA5eSVhPHO+9RcRb/IOgtW31V1Q5IPGtoxPjC+MEJbVlIMYADd9aHYWUIQKopuPOHmoqSkubnAKnzgKHqgIOfW5RdAgotN6BN+O2ZYHkuemLnvQ8U9THVrS1RtLmKbcC7PeeDsYznvqzeg6VCNwmr0Yyx1wnLjyT84BZz3EJyCptD3yeueAyDWIs0L2qs/VQ3HUyqfrja0V1LdDzqAikeWuV4sc7RLIB69jEIBjCkyZedoUHqCrOvShVzyd73OdrJW0hPOuQv2qOoHDc9xVb6Yu6uq3Xqp2ZaH46A7lzevbxQEmfrzvAYSJuZ4WDk1Hz3QX1LVdiUK0EvlAGAYlG3Md30r7dcPN63yqBCIj25prpvZP0nI4+EgWoFG95V596CurXpKRBGRjQlHCvy5Ib/iW8nZJWwrET3mgd6mEhfP4KCuaLjopWs7h+MdXFdIv8dHQJgg1xi1eYqB0uDYjxwVmri0Sv5XKut/onqapC+FQiC2C1lvYJ9MVco6yDYsS3AANUfMtvtbYI2hfwZatiSsnoUeMZd34GVjkMMKA+XnjJpXgRW2SHTZplVowPmJsvXy6w3cfO1AK2dvtZEKTkC/TY9LFiKHCG0DnrMQdGm2lzlBHM9iEYynH2UcVMhUEjsc0oDBTgo2ZSQ1gzkAHeWeBXYFjYLuuf8yzTCy7/RFR81WDjXMbq2BOH5dURnxo6oivmxL3cKzKInlZkD31nvpHB9Kk7GfcfE1t+1V64b9LtgeJGlpRFxQCAqWJ5DoY77ski8gsOEOr2uywZaoO/NGa0X0y1pNQHBi3b2SUGNpcZxDT7rLbBf1FSnQ8guxGW3W+36BW0gBje4DOz6Ba6SVk0xiKgt+q2JOFyr4SYfnu+Ic1QZYIuwHBrgzr6UvOcSCzPTOo7D6IC4ISeS7zkl4h+2VoeHpnG/uWR3+ysNgPcOIXQbv0n4mr3BwQcdKJxgPSeyuP/z1Jjg4e9nUvoXegqQVIE30EHx5GHv+FAVUNTowYDJgyFhf5IvlYmEqRif6+WN1MkEJmDcQITx9FX23a4mxy1AQRsOHO/+eImX9l8EMJI3oPWzVXxSOeHU1dUWYr2uAA7AMb+vAEZSbU3qob9ibCyXeypEMpZ6863o6QPqlqGHZkuWABSTVNd4cOh9hv3qEpSx2Zy/DJMP6cItEmiBJ5PFqQnDEIt3NrA3COlOSgz43D7gpNFNJ5MBh4oFzhDPiglC2ypsNU4ISywY2erkyb1NC3Qh/IfWj0eDgZI4/ln8WPfBsT3meTjq1Uqt1E7Zl/qftqkx6aM9KueMCekSnMrcHj1CqTWWzEzPsZGcDe3Ue4Ws+XFYVxNbOFF8ezkvQGR6ZOtOLU2lQEnMBStx47vE6Pb7AYMBRj2OOfZXfisjJnpTfSNjo6sZ6qSvNxZNm
DeS7Gk3yYyCk1HtKN2UnhMIjOXUzAqDv90lx9O/q/AT1ZMnit5XQe9wmQxnE/WSH0CqZ9/2Hy+Sfmpeg8RwsHI5Z8kC8H293m/LHVVM/BA7HaTJYg5Enk7M/xWpq0192ACfBai2LA/qrCjCr6Dh1BIMzMXINBmX96MJ5Hn2nxln/RXPFhwHxUmSV0EV2V0jm86/dxxuYSU1W7sVkEbN9EzkG0QFwPhyHKyb3t+Fj5WoUUTErcazE/N6EW6Lvp0d//SDPj7EV9UdJN+Amnf3Wwk3A0SlJ9Z00yvXZ7n3z70G47Hfsow8Wq1JXcfwnA+Yxa5mFsgV464KKP4T31wqIgzFPd3eCe3j5ory5fBF2hgCFyVFrLzI9eetNXvM7oQqyFgDo4CTp/hDV9NMX9JDHQ/nyHTLvZLNLF6ftn2OxjGm8+PqOwhxnPHWipkE/8wbtyri80Sr7pMNkQGMfo4ZYK9OcCC4ESVFFbLMIvlxSoRqWie0wxqnLfcLSXMSpMMQEJYDVObYsXIQNv4TGNwjq1kvT1UOkicTrG3IaBZ3XdScS3u8sgeZPVpOLkbiF940FjbCeNRINNvDbd01EPBrTCPpm12m43ze1bBB59Ia6Ovhnur/Nvx3IxwSWol+3H2qfCJR8df6aQf4v6WiONxkK+IqT4pKQrZK/LplgDI/PJZbOep8dtbV7oCr6CgfpWa8NczOkPx81iSHbsNhVSJBOtrLIMrL31LK9TqHqAbAHe0RLmmV806kRLDLNEhUEJfm9u0sxpkL93Zgd6rw+tqBfTMi59xqXHLXSHwSbSBl0EK0+loECOPtrl+/nsaFe197di4yUgoe4jKoAJDXc6DGDjrQOoFDWZJ9HXwt8xDrQP+7aRwWKWI1GF8s8O4KzxWBBcwnl3vnl1Oez3oh6Ea1vjR7/z7DDTrFtqU2W/KAEzAuXDNZ7MY73MF216dzdSbWmUp4lcm7keJfWaMHgut9x5C9mj66Z0lJ+yhsjVvyiWrfk1lzPOTdhG15Y7gQlXtacvI7qv/XNSscDwqkgwHT/gUsD5yB7LdRRvJxQGYINn9hTpodKFVSTPrtGvyQw+HlRFXIkodErAGu9Iy1YpfSPc3jkFh5CX3lPxv7aqjE/JAfTIpEjGb/H7MO0e2vsViSW1qa/Lmi4/n4DEI3g7lYrcanspDfEpKkdV1OjSLOy0BCUqVoECaB55vs06rXl4jqmLsPsFM/7vYJ0vrBhDCm/00A/H81l1uekJ/6Lml3Hb9+NKiLqATJmDpyzfYZFHumEjC662L0Bwkxi7E9U4cQA0XMVDuMYAIeLMPgQaMVOd8fmt5SflFIfuBoszeAw7ow5gXPE2Y/yBc/7jExARUf/BxIHQBF5Sn3i61w4z5xJdCyO1F1X3+3ax+JSvMeZ7S6QSKp1Fp/sjYz6Z+VgCZzibGeEoujryfMulH7Rai5kAft9ebcW50DyJr2uo2z97mTWIu45YsSnNSMrrNUuG1XsYBtD9TDYzQffKB87vWbkM4EbPAFgoBV4GQS+vtFDUqOFAoi1nTtmIOvg38N4hT2Sn8r8clmBCXspBlMBYTnrqFJGBT3wZOzAyJDre9dHH7+x7qaaKDOB4UQALD5ecS0DE4obubQEiuJZ0EpBVpLuYcce8Aa4PYd/V4DLDAJBYKQPCWTcrEaZ5HYbJi11Gd6hjGom1ii18VHYnG28NKpkz2UKVPxlhYSp8uZr367iOmoy7zsxehW9wzcy2zG0a80PBMCRQMb32hnaHeOR8fnNDzZhaNYhkOdDsBUZ3loDMa1YP0uS0cjUP3b/6DBlqmZOeNABDsLl5BI5QJups8uxAuWJdkUB/pO6Zax6tsg7fN5mjjDgMGngO+DPcKqiHIDbFIGudxtPTIyDi9SFMKBDcfdGQRv41q1AqmxgkVfJMnP8w/Bc7N9/TR6C7mGObFqFkIEom8sKi2xYqJLTCHK7cxzaZvqODo22c3wisBCP4HeAgcRbNPAsBkNRhSmD
48dHupdBRw4mIvtS5oeF6zeT1KMCyhMnmhpkFAGWnGscoNkwvQ8ZM5lE/vgTHFYL99OuNxdFBxTEDd5v2qLR8y9WkXsWgG6kZNndFG+pO/UAkOCipqIhL3hq7cRSdrCq7YhUsTocEcnaFa6nVkhnSeRYUA1YO0z5itF9Sly3VlxYDw239TJJH6f3EUfYO5lb7bcFcz8Bp7Oo8QmnsUHOz/fagVUBtKEw1iT88j+aKkv8cscKNkMxjYr8344D1kFoZ7/td1W6LCNYN594301tUGRmFjAzeRg5vyoM1F6+bJZ/Q54jN/k8SFd3DxPTYaAUsivsBfgTn7Mx8H2SpPt4GOdYRnEJOH6jHM2p6SgB0gzIRq6fHxGMmSmqaPCmlfwxiuloaVIitLGN8wie2CDWhkzLoCJcODh7KIOAqbHEvXdUxaS4TTTs07Clzj/6GmVs9kiZDerMxEnhUB6QQPlcfqkG9882RqHoLiHGBoHfQuXIsAG8GTAtao2KVwRnvvam8jo1e312GQAKWEa4sUVEAMG4G6ckcONDwRcg1e2D3+ohXgY4UAWF8wHKQMrSnzCgfFpsxh+aHXMGtPQroQasRY4U6UdG0rz1Vjbka0MekOGRZQEvqQFlxseFor8zWFgHek3v29+WqN6gaK5gZOTOMZzpQIC1201LkMCXild3vWXSc5UX9xcFYfbRPzGFa1FDcPfPB/jUEq/FeGt419CI3YmBlVoHsa4KdcwQP5ZSwHHhFJ7/Ph/Rap/4vmG91eDwPP0lDfCDRCLszTqfzM71xpmiKi2HwS4WlqvGNwtvwF5Dqpn6KTq8ax00UMPkxDcZrEEEsIvHiUXXEphdb4GB4FymlPwBz4Gperqq5pW7TQ6/yNRhW8VT5NhuP0udlxo4gILq5ZxAZk8ZGh3g4CqxJlPKY7AQxupfUcVpWT5VItp1+30UqoyP4wWsRo3olRRgkWZZ2ZN6VC3OZFeXB8NbnUrSdikNptD1QiGuKkr8EmSR/AK9Rw+FF3s5uwuPbvHGiPeFOViltMK7AUaOsq9+x9cndk3iJEE5LKZRlWJbKOZweROzmPNVPkjE3K/TyA57Rs68TkZ3MR8akKpm7cFjnjPd/DdkWjgYoKHSr5Wu5ssoBYU4acRs5g2DHxUmdq8VXOXRbunD8QN0LhgkssgahcdoYsNvuXGUK/KXD/7oFb+VGdhqIn02veuM5bLudJOc2Ky0GMaG4W/xWBxIJcL7yliJOXOpx0AkBqUgzlDczmLT4iILXDxxtRR1oZa2JWFgiAb43obrJnG/TZC2KSK2wqOzRZTXavZZFMb1f3bXvVaNaK828w9TO610gk8JNf3gMfETzXXsbcvRGCG9JWQZ6+cDPqc4466Yo2RcKH+PILeKOqtnlbInR3MmBeGG3FH10yzkybuqEC2HSQwpA0An7d9+73BkDUTm30bZmoP/RGbgFN+GrCOfADgqr0WbI1a1okpFms8iHYw9hm0zUvlEMivBRxModrbJJ+9/p3jUdQQ9BCtQdxnOGrT5dzRUmw0593/mbRSdBg0nRvRZM5/E16m7ZHmDEtWhwvfdZCZ8J8M12W0yRMszXamWfQTwIZ4ayYktrnscQuWr8idp3PjT2eF/jmtdhIfcpMnb+IfZY2FebW6UY/AK3jP4u3Tu4zE4qlnQgLFbM19EBIsNf7KhjdbqQ/D6yiDb+NlEi2SKD+ivXVUK8ib0oBo366gXkR8ZxGjpJIDcEgZPa9TcYe0TIbiPl/rPUQDu3XBJ9X/GNq3FAUsKsll57DzaGMrjcT+gctp+9MLYXCq+sqP81eVQ0r9lt+gcQfZbACRbEjvlMskztZG8gbC8Qn9tt26Q7y7nDrbZq/LEz7kR6Jc6pg3N9rVX8Y5MJrGlML9p9lU4jbTkKqCveeZUJjHB03m2KRKR2TytoFkTXOLg7keU1s1lrPMQJpoOKLuAAC+y1HlJucU6ysB5hsXhvSPPLq5J7JtnqHKZ4vYjC4Vy8153
QY+6780xDuGARsGbOs1WqzH0QS765rnSKEbbKlkO8oI/VDwUd0is13tKpqILu1mDJFNy/iJAWcvDgjxvusIT+PGz3ST/J9r9Mtfd0jpaGeiLYIqXc7DiHSS8TcjFVksi66PEkxW1z6ujbLLUGNNYnzOWpH8BZGK4bCK7iR+MbIv8ncDAz1u4StN3vTTzewr9IQjk9wxFxn+6N1ddKs0vffJiS08N3a4G1SVrlZ97Q/M+8G9fe5AP6d9/Qq4WRnORVhofPIKEdCr3llspUfE0oKIIYoByBRPh+bX1HLS3JWGJRhIvE1aW4NTd8ePi4Z+kXb+Z8snYfSNcqijhAgVsx4RCM54cXUiYkjeBmmC4ajOHrChoELscJJC7+9jjMjw5BagZKlgRMiSNYz7h7vvZIoQqbtQmspc0cUk1G/73iXtSpROl5wtLgQi0mW2Ex8i3WULhcggx6E1LMVHUsdc9GHI1PH3U2Ko0PyGdn9KdVOLm7FPBui0i9a0HpA60MsewVE4z8CAt5d401Gv6zXlIT5Ybit1VIA0FCs7wtvYreru1fUyW3oLAZ/+aTnZrOcYRNVA8spoRtlRoWflsRClFcgzkqiHOrf0/SVw+EpVaFlJ0g4Kxq1MMOmiQdpMNpte8lMMQqm6cIFXlnGbfJllysKDi+0JJMotkqgIxOSQgU9dn/lWkeVf8nUm3iwX2Nl3WDw9i6AUK3vBAbZZrcJpDQ/N64AVwjT07Jef30GSSmtNu2WlW7YoyW2FlWfZFQUwk867EdLYKk9VG6JgEnBiBxkY7LMo4YLQJJlAo9l/oTvJkSARDF/XtyAzM8O2t3eT/iXa6wDN3WewNmQHdPfsxChU/KtLG2Mn8i4ZqKdSlIaBZadxJmRzVS/o4yA65RTSViq60oa395Lqw0pzY4SipwE0SXXsKV+GZraGSkr/RW08wPRvqvSUkYBMA9lPx4m24az+IHmCbXA+0faxTRE9wuGeO06DIXa6QlKJ3puIyiuAVfPr736vzo2pBirS+Vxel3TMm3JKhz9o2ZoRvaFVpIkykb0Hcm4oHFBMcNSNj7/4GJt43ogonY2Vg4nsDQIWxAcorpXACzgBqQPjYsE/VUpXpwNManEru4NwMCFPkXvMoqvoeLN3qyu/N1eWEHttMD65v19l/0kH2mR35iv/FI+yjoHJ9gPMz67af3Mq/BoWXqu3rphiWMXVkmnPSEkpGpUI2h1MThideGFEOK6YZHPwYzMBvpNC7+ZHxPb7epfefGyIB4JzO9DTNEYnDLVVHdQyvOEVefrk6Uv5kTQYVYWWdqrdcIl7yljwwIWdfQ/y+2QB3eR/qxYObuYyB4gTbo2in4PzarU1sO9nETkmj9/AoxDA+JM3GMqQtJR4jtduHtnoCLxd1gQUscHRB/MoRYIEsP2pDZ9KvHgtlk1iTbWWbHhohwFEYX7y51fUV2nuUmnoUcqnWIQAAgl9LTVX+Bc0QGNEhChxHR4YjfE51PUdGfsSFE6ck7BL3/hTf9jLq4G1IafINxOLKeAtO7quulYvH5YOBc+zX7CrMgWnW47/jfRsWnJjYYoE7xMfWV2HN2iyIqLI';
  // Code point -> display name for three punctuation characters.
  // The table is written out literally: a note inside init() records that
  // including it directly is smaller than the code needed to decompress it.
  const FENCED = new Map([
    [0x2019, "apostrophe"],
    [0x2044, "fraction slash"],
    [0x30FB, "middle dot"],
  ]);
  // NOTE(review): presumably the limit on consecutive non-spacing marks (NSM);
  // the code that reads it is outside this part of the file -- confirm.
  const NSM_MAX = 4;
  /**
   * Decode an arithmetic-coded byte stream into an array of integers.
   *
   * Layout of `bytes`, as read below:
   *   u16 symbol_count
   *   (symbol_count - 1) x u16 frequencies (symbol 0 has an implicit frequency of 1)
   *   u16 skip   -- byte length of the payload section
   *   skip bytes -- payload, consumed by the last three symbols
   *   remaining  -- the coded bit stream, most significant bit first
   *
   * Symbol 0 is the end mark. The last three symbols stand for values stored
   * in the payload section as 1, 2 or 3 bytes; every other symbol `x` decodes
   * to `x - 1`.
   *
   * @param {ArrayLike<number>} bytes - encoded input (byte values).
   * @returns {number[]} decoded values, in stream order.
   */
  function decode_arithmetic(bytes) {
    let pos = 0;
    // big-endian 16-bit read
    const u16 = () => {
      const hi = bytes[pos++];
      const lo = bytes[pos++];
      return (hi << 8) | lo;
    };

    // cumulative frequency table: acc[k] .. acc[k+1] is the slice of symbol k
    const symbol_count = u16();
    const acc = [0, 1]; // symbol 0 (end mark) always has frequency 1
    let total = 1;
    for (let i = 1; i < symbol_count; i++) {
      total += u16();
      acc.push(total);
    }

    // remember where the payload starts, then jump over it to the bit stream
    const skip = u16();
    let pos_payload = pos;
    pos += skip;

    let bits_left = 0;
    let bit_buffer = 0;
    const read_bit = () => {
      if (bits_left === 0) {
        // reading past the end yields undefined, and (x | undefined) === x,
        // so the stream is effectively zero-padded
        bit_buffer = (bit_buffer << 8) | bytes[pos++];
        bits_left = 8;
      }
      bits_left -= 1;
      return (bit_buffer >> bits_left) & 1;
    };

    const N = 31;
    const FULL = 2 ** N;
    const HALF = FULL >>> 1;
    const QRTR = HALF >> 1;
    const MASK = FULL - 1;

    // prime the register with the first N bits
    let register = 0;
    for (let i = 0; i < N; i++) {
      register = (register << 1) | read_bit();
    }

    const symbols = [];
    let low = 0;
    let range = FULL; // kept as a plain (floating point) number
    for (;;) {
      const value = Math.floor((((register - low + 1) * total) - 1) / range);

      // binary search for the symbol whose slice contains `value`
      let start = 0;
      let end = symbol_count;
      while (end - start > 1) {
        const mid = (start + end) >>> 1;
        if (value < acc[mid]) {
          end = mid;
        } else {
          start = mid;
        }
      }
      if (start === 0) break; // end mark
      symbols.push(start);

      // narrow [a, b] to the slice of the decoded symbol
      let a = low + Math.floor(range * acc[start] / total);
      let b = low + Math.floor(range * acc[start + 1] / total) - 1;

      // top bits agree: shift them out and pull in a fresh bit
      while (((a ^ b) & HALF) === 0) {
        register = (register << 1) & MASK | read_bit();
        a = (a << 1) & MASK;
        b = (b << 1) & MASK | 1;
      }
      // a has the quarter bit set and b does not:
      // keep the top bit and shift out the one below it
      while (a & ~b & QRTR) {
        register = (register & HALF) | ((register << 1) & (MASK >>> 1)) | read_bit();
        a = (a << 1) ^ HALF;
        b = ((b ^ HALF) << 1) | HALF | 1;
      }

      low = a;
      range = 1 + b - a;
    }

    // resolve the three "sized" symbols against the payload section
    const offset = symbol_count - 4;
    const payload_byte = () => bytes[pos_payload++];
    return symbols.map((x) => {
      const kind = x - offset;
      if (kind === 3) {
        return offset + 0x10100 + ((payload_byte() << 16) | (payload_byte() << 8) | payload_byte());
      }
      if (kind === 2) {
        return offset + 0x100 + ((payload_byte() << 8) | payload_byte());
      }
      if (kind === 1) {
        return offset + payload_byte();
      }
      return x - 1;
    });
  }
  /**
   * Wrap an indexable sequence in a reader function.
   * Each call returns the next element (undefined once the end is passed);
   * any arguments given to the reader are ignored.
   */
  function read_payload(v) {
    let cursor = 0;
    return () => {
      const value = v[cursor];
      cursor += 1;
      return value;
    };
  }
  /**
   * Build a symbol reader from a Base64 string:
   * Base64 text -> bytes -> arithmetic-decoded symbols -> reader function.
   */
  function read_compressed_payload(s) {
    const bytes = unsafe_atob(s);
    const symbols = decode_arithmetic(bytes);
    return read_payload(symbols);
  }
  /**
   * Minimal Base64 decoder.
   *
   * "Unsafe" because no validation is done: the input is expected to be
   * well-formed Base64 without padding.
   * 20220922: added for https://github.com/adraffy/ens-normalize.js/issues/4
   *
   * @param {string} s - Base64 text (standard alphabet, no '=' padding).
   * @returns {Uint8Array} decoded bytes, floor(6 * s.length / 8) of them.
   */
  function unsafe_atob(s) {
    const alphabet = 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/';
    // char code -> 6-bit value
    const lookup = [];
    for (let k = 0; k < alphabet.length; k++) {
      lookup[alphabet.charCodeAt(k)] = k;
    }
    const n = s.length;
    const ret = new Uint8Array((6 * n) >> 3);
    let pos = 0;   // next write index
    let width = 0; // bits in `carry` not yet written out
    let carry = 0; // bit accumulator; the byte store keeps only the low 8 bits
    for (let i = 0; i < n; i++) {
      carry = (carry << 6) | lookup[s.charCodeAt(i)];
      width += 6;
      if (width >= 8) {
        width -= 8;
        ret[pos] = carry >> width;
        pos += 1;
      }
    }
    return ret;
  }
  /**
   * Undo the interleaved encoding of signed integers:
   * 0, 1, 2, 3, 4, ... => 0, -1, 1, -2, 2, ...
   * (odd inputs map to negatives, even inputs to non-negatives).
   */
  function signed(i) {
    if (i & 1) {
      return ~i >> 1;
    }
    return i >> 1;
  }
  /**
   * Read `n` values stored as signed deltas and return the running totals.
   * Each value from `next()` is passed through signed() and added to the sum.
   */
  function read_deltas(n, next) {
    const totals = Array(n);
    let running = 0;
    for (let k = 0; k < n; k++) {
      running += signed(next());
      totals[k] = running;
    }
    return totals;
  }
  /**
   * Read an ascending list stored as (gap, run-length) pairs.
   *
   * Pairs are read until one has a falsy run-length. For each pair the base
   * advances by `gap`, `run` consecutive integers are emitted from the base,
   * and the base then moves to one past the value following the run.
   * Example: pairs (0,3) (1,1) (0,0) => [0, 1, 2, 5].
   *
   * @param {() => number} next - symbol reader.
   * @param {number} [prev=0] - starting base value.
   * @returns {number[]}
   */
  function read_sorted(next, prev = 0) {
    const ret = [];
    let base = prev;
    for (;;) {
      const gap = next();
      const run = next();
      if (!run) {
        return ret;
      }
      base += gap;
      for (let k = 0; k < run; k++) {
        ret.push(base + k);
      }
      base += run + 1;
    }
  }
  /**
   * Read consecutive read_sorted() lists until an empty one is encountered.
   * @returns {number[][]} the non-empty lists, in order.
   */
  function read_sorted_arrays(next) {
    return read_array_while(() => {
      const run = read_sorted(next);
      return run.length ? run : undefined; // undefined ends the outer read
    });
  }
  /**
   * Read the mapping tables and return them as one flat list of [x, ys]
   * pairs (suitable for `new Map(...)`).
   *
   * Two sections are read in order:
   *   1. linear tables, each introduced by its width w, ended by w == 0
   *   2. replacement tables, each introduced by w + 1, ended by 0
   */
  function read_mapped(next) {
    const tables = [];
    for (let w = next(); w != 0; w = next()) {
      tables.push(read_linear_table(w, next));
    }
    for (let w = next() - 1; !(w < 0); w = next() - 1) {
      tables.push(read_replacement_table(w, next));
    }
    return tables.flat();
  }
  /**
   * Collect values from `next` until it returns something falsy.
   * `next` is called with the number of values collected so far.
   * @returns {Array} the truthy values, in order.
   */
  function read_array_while(next) {
    const collected = [];
    for (let item = next(0); item; item = next(collected.length)) {
      collected.push(item);
    }
    return collected;
  }
  /**
   * Read `w` delta-encoded columns of length `n` and return them transposed,
   * i.e. as `n` rows of length `w`.
   */
  function read_transposed(n, w, next) {
    const rows = Array(n);
    for (let j = 0; j < n; j++) {
      rows[j] = [];
    }
    for (let col = 0; col < w; col++) {
      const column = read_deltas(n, next);
      for (let j = 0; j < n; j++) {
        rows[j].push(column[j]);
      }
    }
    return rows;
  }
  /**
   * Read a table of arithmetic runs and expand it.
   *
   * Reads the steps dx (stored minus one) and dy, a list of run sizes, then
   * one row [x, ...ys] per run. A run of size n expands to
   *   [x, ys], [x + dx, ys + dy], ..., [x + (n-1)*dx, ys + (n-1)*dy]
   * where dy is added to every element of ys.
   *
   * @param {number} w - length of each ys.
   * @param {() => number} next - symbol reader.
   * @returns {Array<[number, number[]]>}
   */
  function read_linear_table(w, next) {
    const dx = 1 + next();
    const dy = next();
    const run_sizes = read_array_while(next);
    const rows = read_transposed(run_sizes.length, 1 + w, next);
    const pairs = [];
    rows.forEach(([x, ...ys], i) => {
      const size = run_sizes[i];
      for (let j = 0; j < size; j++) {
        const shift = j * dy;
        pairs.push([x + j * dx, ys.map((y) => y + shift)]);
      }
    });
    return pairs;
  }
  /**
   * Read a table of explicit [x, ys] entries.
   * The row count is stored minus one; each row is x followed by w values.
   *
   * @param {number} w - length of each ys.
   * @param {() => number} next - symbol reader.
   * @returns {Array<[number, number[]]>}
   */
  function read_replacement_table(w, next) {
    const row_count = 1 + next();
    const rows = read_transposed(row_count, 1 + w, next);
    return rows.map(([x, ...ys]) => [x, ys]);
  }
  /**
   * Read a trie and return every code point sequence it marks as valid.
   *
   * Each node carries a flag word:
   *   1 -- valid: the sequence leading here is emitted
   *   2 -- save:  remember the last code point of the sequence
   *   4 -- check: stop if the remembered code point equals the last one
   *
   * @param {() => number} next - symbol reader.
   * @returns {number[][]} sequences in traversal order (not sorted).
   */
  function read_trie(next) {
    const sorted = read_sorted(next);
    const ret = [];

    // Read one node; `leads` are the code points on the edge into it.
    function decode(leads) {
      const flags = next();
      const children = read_array_while(() => {
        const cps = read_sorted(next).map((i) => sorted[i]);
        if (cps.length) return decode(cps);
      });
      return { flags, children, leads };
    }

    // Walk the trie depth-first, collecting valid sequences into `ret`.
    function expand(node, cps, saved) {
      const last = cps[cps.length - 1];
      if (node.flags & 4 && saved === last) return;
      if (node.flags & 2) saved = last;
      if (node.flags & 1) ret.push(cps);
      for (const child of node.children) {
        for (const cp of child.leads) {
          expand(child, [...cps, cp], saved);
        }
      }
    }

    expand(decode([]), []);
    return ret;
  }
  /**
   * Format a code point as upper-case hexadecimal, at least two digits wide.
   */
  function hex_cp(cp) {
    const hex = cp.toString(16);
    return hex.toUpperCase().padStart(2, '0');
  }
  /**
   * Wrap the hex form of a code point in braces, e.g. "{1F600}".
   * raffy convention: like "\u{X}" w/o the "\u"
   */
  function quote_cp(cp) {
    const hex = hex_cp(cp);
    return `{${hex}}`;
  }
  /**
   * Split a string into its code points.
   *
   * Same result as `[...s].map(c => c.codePointAt(0))`; the manual walk was
   * noted by the original author as about 2x faster.
   *
   * @param {string} s
   * @returns {number[]}
   */
  function explode_cp(s) {
    const cps = [];
    const len = s.length;
    let pos = 0;
    while (pos < len) {
      const cp = s.codePointAt(pos);
      cps.push(cp);
      // code points at or above 0x10000 occupy two UTF-16 code units
      pos += cp < 0x10000 ? 1 : 2;
    }
    return cps;
  }
  /**
   * Build a string from an array of code points.
   * Long inputs are converted in slices of 4096 so that no single
   * String.fromCodePoint() call receives a very large argument list.
   *
   * @param {number[]} cps
   * @returns {string}
   */
  function str_from_cps(cps) {
    const chunk = 4096;
    const len = cps.length;
    if (len < chunk) {
      return String.fromCodePoint(...cps);
    }
    const parts = [];
    for (let start = 0; start < len; start += chunk) {
      const piece = cps.slice(start, start + chunk);
      parts.push(String.fromCodePoint(...piece));
    }
    return parts.join('');
  }
  /**
   * Order two numeric arrays: first by length, then element-wise.
   * @returns {number} negative, zero or positive (the first non-zero difference).
   */
  function compare_arrays(a, b) {
    const n = a.length;
    let result = n - b.length;
    if (result != 0) {
      return result;
    }
    for (let i = 0; i < n; i++) {
      result = a[i] - b[i];
      if (result != 0) break;
    }
    return result;
  }
  /**
   * Normalize a code point array using the platform's String#normalize.
   *
   * "Reverse polyfill": this build relies on the system implementation
   * instead of a bundled custom one (saves approximately 6KB).
   *
   * @param {number[]} cps - code points.
   * @param {string} form - normalization form passed to String#normalize.
   * @returns {number[]} normalized code points.
   */
  function nf(cps, form) {
    const text = str_from_cps(cps);
    const normalized = text.normalize(form);
    return explode_cp(normalized);
  }
  /** Normalize code points to form NFC. */
  function nfc(cps) {
    const form = 'NFC';
    return nf(cps, form);
  }
  /** Normalize code points to form NFD. */
  function nfd(cps) {
    const form = 'NFD';
    return nf(cps, form);
  }
  // Frequently used code points and markers.
  const HYPHEN = 0x2D;  // '-'
  const STOP = 0x2E;    // '.', the code point of STOP_CH
  const STOP_CH = '.';
  const FE0F = 0xFE0F;  // U+FE0F VARIATION SELECTOR-16
  // NOTE(review): placeholder value; its use is outside this part of the file.
  const UNIQUE_PH = 1;
  // 20230913: use Array_from(v) in place of [...v] to avoid large spreads.
  // A thin wrapper, so exactly one argument is forwarded to Array.from
  // (the alternative noted originally was Array.from.bind(Array)).
  const Array_from = (iterable) => Array.from(iterable);
  /**
   * Test whether code point `cp` belongs to group `g`.
   * 20230913: the primary (P) and secondary (Q) sets are kept distinct
   * rather than merged into one union, so both are consulted.
   */
  function group_has_cp(g, cp) {
    const in_primary = g.P.has(cp);
    return in_primary || g.Q.has(cp);
  }
  /**
   * Array subclass used as a tag: instances behave like ordinary arrays,
   * and `is_emoji` tells them apart from plain arrays (where the property
   * is undefined).
   */
  class Emoji extends Array {
    // free tagging system
    get is_emoji() {
      return true;
    }
  }
  282. let MAPPED, IGNORED, CM, NSM, ESCAPE, NFC_CHECK, GROUPS, WHOLE_VALID, WHOLE_MAP, VALID, EMOJI_LIST, EMOJI_ROOT;
  283. function init() {
  284. if (MAPPED) return;
  285. let r = read_compressed_payload(COMPRESSED);
  286. const read_sorted_array = () => read_sorted(r);
  287. const read_sorted_set = () => new Set(read_sorted_array());
  288. const set_add_many = (set, v) => v.forEach(x => set.add(x));
  289. MAPPED = new Map(read_mapped(r));
  290. IGNORED = read_sorted_set(); // ignored characters are not valid, so just read raw codepoints
  291. /*
  292. // direct include from payload is smaller than the decompression code
  293. const FENCED = new Map(read_array_while(() => {
  294. let cp = r();
  295. if (cp) return [cp, read_str(r())];
  296. }));
  297. */
  298. // 20230217: we still need all CM for proper error formatting
  299. // but norm only needs NSM subset that are potentially-valid
  300. CM = read_sorted_array();
  301. NSM = new Set(read_sorted_array().map(i => CM[i]));
  302. CM = new Set(CM);
  303. ESCAPE = read_sorted_set(); // characters that should not be printed
  304. NFC_CHECK = read_sorted_set(); // only needed to illustrate ens_tokenize() transformations
  305. let chunks = read_sorted_arrays(r);
  306. let unrestricted = r();
  307. //const read_chunked = () => new Set(read_sorted_array().flatMap(i => chunks[i]).concat(read_sorted_array()));
  308. const read_chunked = () => {
  309. // 20230921: build set in parts, 2x faster
  310. let set = new Set();
  311. read_sorted_array().forEach(i => set_add_many(set, chunks[i]));
  312. set_add_many(set, read_sorted_array());
  313. return set;
  314. };
  315. GROUPS = read_array_while(i => {
  316. // minifier property mangling seems unsafe
  317. // so these are manually renamed to single chars
  318. let N = read_array_while(r).map(x => x+0x60);
  319. if (N.length) {
  320. let R = i >= unrestricted; // unrestricted then restricted
  321. N[0] -= 32; // capitalize
  322. N = str_from_cps(N);
  323. if (R) N=`Restricted[${N}]`;
  324. let P = read_chunked(); // primary
  325. let Q = read_chunked(); // secondary
  326. let M = !r(); // not-whitelisted, check for NSM
  327. // *** this code currently isn't needed ***
  328. /*
  329. let V = [...P, ...Q].sort((a, b) => a-b); // derive: sorted valid
  330. let M = r()-1; // number of combining mark
  331. if (M < 0) { // whitelisted
  332. M = new Map(read_array_while(() => {
  333. let i = r();
  334. if (i) return [V[i-1], read_array_while(() => {
  335. let v = read_array_while(r);
  336. if (v.length) return v.map(x => x-1);
  337. })];
  338. }));
  339. }*/
  340. return {N, P, Q, M, R};
  341. }
  342. });
  343. // decode compressed wholes
  344. WHOLE_VALID = read_sorted_set();
  345. WHOLE_MAP = new Map();
  346. let wholes = read_sorted_array().concat(Array_from(WHOLE_VALID)).sort((a, b) => a-b); // must be sorted
  347. wholes.forEach((cp, i) => {
  348. let d = r();
  349. let w = wholes[i] = d ? wholes[i-d] : {V: [], M: new Map()};
  350. w.V.push(cp); // add to member set
  351. if (!WHOLE_VALID.has(cp)) {
  352. WHOLE_MAP.set(cp, w); // register with whole map
  353. }
  354. });
  355. // compute confusable-extent complements
  356. // usage: WHOLE_MAP.get(cp).M.get(cp) = complement set
  357. for (let {V, M} of new Set(WHOLE_MAP.values())) {
  358. // connect all groups that have each whole character
  359. let recs = [];
  360. for (let cp of V) {
  361. let gs = GROUPS.filter(g => group_has_cp(g, cp));
  362. let rec = recs.find(({G}) => gs.some(g => G.has(g)));
  363. if (!rec) {
  364. rec = {G: new Set(), V: []};
  365. recs.push(rec);
  366. }
  367. rec.V.push(cp);
  368. set_add_many(rec.G, gs);
  369. }
  370. // per character cache groups which are not a member of the extent
  371. let union = recs.flatMap(x => Array_from(x.G)); // all of the groups used by this whole
  372. for (let {G, V} of recs) {
  373. let complement = new Set(union.filter(g => !G.has(g))); // groups not covered by the extent
  374. for (let cp of V) {
  375. M.set(cp, complement); // this is the same reference
  376. }
  377. }
  378. }
  379. // compute valid set
  380. // 20230924: VALID was union but can be re-used
  381. VALID = new Set(); // exists in 1+ groups
  382. let multi = new Set(); // exists in 2+ groups
  383. const add_to_union = cp => VALID.has(cp) ? multi.add(cp) : VALID.add(cp);
  384. for (let g of GROUPS) {
  385. for (let cp of g.P) add_to_union(cp);
  386. for (let cp of g.Q) add_to_union(cp);
  387. }
  388. // dual purpose WHOLE_MAP: return placeholder if unique non-confusable
  389. for (let cp of VALID) {
  390. if (!WHOLE_MAP.has(cp) && !multi.has(cp)) {
  391. WHOLE_MAP.set(cp, UNIQUE_PH);
  392. }
  393. }
  394. // add all decomposed parts
  395. // see derive: "Valid is Closed (via Brute-force)"
  396. set_add_many(VALID, nfd(VALID));
  397. // decode emoji
  398. // 20230719: emoji are now fully-expanded to avoid quirk logic
  399. EMOJI_LIST = read_trie(r).map(v => Emoji.from(v)).sort(compare_arrays);
  400. EMOJI_ROOT = new Map(); // this has approx 7K nodes (2+ per emoji)
  401. for (let cps of EMOJI_LIST) {
  402. // 20230719: change to *slightly* stricter algorithm which disallows
  403. // insertion of misplaced FE0F in emoji sequences (matching ENSIP-15)
  404. // example: beautified [A B] (eg. flag emoji)
  405. // before: allow: [A FE0F B], error: [A FE0F FE0F B]
  406. // after: error: both
  407. // note: this code now matches ENSNormalize.{cs,java} logic
  408. let prev = [EMOJI_ROOT];
  409. for (let cp of cps) {
  410. let next = prev.map(node => {
  411. let child = node.get(cp);
  412. if (!child) {
  413. // should this be object?
  414. // (most have 1-2 items, few have many)
  415. // 20230719: no, v8 default map is 4?
  416. child = new Map();
  417. node.set(cp, child);
  418. }
  419. return child;
  420. });
  421. if (cp === FE0F) {
  422. prev.push(...next); // less than 20 elements
  423. } else {
  424. prev = next;
  425. }
  426. }
  427. for (let x of prev) {
  428. x.V = cps;
  429. }
  430. }
  431. }
  432. // if escaped: {HEX}
  433. // else: "x" {HEX}
  434. function quoted_cp(cp) {
  435. return (should_escape(cp) ? '' : `${bidi_qq(safe_str_from_cps([cp]))} `) + quote_cp(cp);
  436. }
  437. // 20230211: some messages can be mixed-directional and result in spillover
  438. // use 200E after a quoted string to force the remainder of a string from
  439. // acquring the direction of the quote
  440. // https://www.w3.org/International/questions/qa-bidi-unicode-controls#exceptions
  441. function bidi_qq(s) {
  442. return `"${s}"\u200E`; // strong LTR
  443. }
  444. function check_label_extension(cps) {
  445. if (cps.length >= 4 && cps[2] == HYPHEN && cps[3] == HYPHEN) {
  446. throw new Error(`invalid label extension: "${str_from_cps(cps.slice(0, 4))}"`); // this can only be ascii so cant be bidi
  447. }
  448. }
  449. function check_leading_underscore(cps) {
  450. const UNDERSCORE = 0x5F;
  451. for (let i = cps.lastIndexOf(UNDERSCORE); i > 0; ) {
  452. if (cps[--i] !== UNDERSCORE) {
  453. throw new Error('underscore allowed only at start');
  454. }
  455. }
  456. }
  457. // check that a fenced cp is not leading, trailing, or touching another fenced cp
  458. function check_fenced(cps) {
  459. let cp = cps[0];
  460. let prev = FENCED.get(cp);
  461. if (prev) throw error_placement(`leading ${prev}`);
  462. let n = cps.length;
  463. let last = -1; // prevents trailing from throwing
  464. for (let i = 1; i < n; i++) {
  465. cp = cps[i];
  466. let match = FENCED.get(cp);
  467. if (match) {
  468. // since cps[0] isn't fenced, cps[1] cannot throw
  469. if (last == i) throw error_placement(`${prev} + ${match}`);
  470. last = i + 1;
  471. prev = match;
  472. }
  473. }
  474. if (last == n) throw error_placement(`trailing ${prev}`);
  475. }
  476. // create a safe to print string
  477. // invisibles are escaped
  478. // leading cm uses placeholder
  479. // if cps exceed max, middle truncate with ellipsis
  480. // quoter(cp) => string, eg. 3000 => "{3000}"
  481. // note: in html, you'd call this function then replace [<>&] with entities
  482. function safe_str_from_cps(cps, max = Infinity, quoter = quote_cp) {
  483. //if (Number.isInteger(cps)) cps = [cps];
  484. //if (!Array.isArray(cps)) throw new TypeError(`expected codepoints`);
  485. let buf = [];
  486. if (is_combining_mark(cps[0])) buf.push('◌');
  487. if (cps.length > max) {
  488. max >>= 1;
  489. cps = [...cps.slice(0, max), 0x2026, ...cps.slice(-max)];
  490. }
  491. let prev = 0;
  492. let n = cps.length;
  493. for (let i = 0; i < n; i++) {
  494. let cp = cps[i];
  495. if (should_escape(cp)) {
  496. buf.push(str_from_cps(cps.slice(prev, i)));
  497. buf.push(quoter(cp));
  498. prev = i + 1;
  499. }
  500. }
  501. buf.push(str_from_cps(cps.slice(prev, n)));
  502. return buf.join('');
  503. }
  504. // note: set(s) cannot be exposed because they can be modified
  505. // note: Object.freeze() doesn't work
  506. function is_combining_mark(cp) {
  507. init();
  508. return CM.has(cp);
  509. }
  510. function should_escape(cp) {
  511. init();
  512. return ESCAPE.has(cp);
  513. }
  514. // return all supported emoji as fully-qualified emoji
  515. // ordered by length then lexicographic
  516. function ens_emoji() {
  517. init();
  518. return EMOJI_LIST.map(x => x.slice()); // emoji are exposed so copy
  519. }
  520. function ens_normalize_fragment(frag, decompose) {
  521. init();
  522. let nf = decompose ? nfd : nfc;
  523. return frag.split(STOP_CH).map(label => str_from_cps(tokens_from_str(explode_cp(label), nf, filter_fe0f).flat())).join(STOP_CH);
  524. }
  525. function ens_normalize(name) {
  526. return flatten(split(name, nfc, filter_fe0f));
  527. }
  528. function ens_beautify(name) {
  529. let labels = split(name, nfc, x => x); // emoji not exposed
  530. for (let {type, output, error} of labels) {
  531. if (error) break; // flatten will throw
  532. // replace leading/trailing hyphen
  533. // 20230121: consider beautifing all or leading/trailing hyphen to unicode variant
  534. // not exactly the same in every font, but very similar: "-" vs "‐"
  535. /*
  536. const UNICODE_HYPHEN = 0x2010;
  537. // maybe this should replace all for visual consistancy?
  538. // `node tools/reg-count.js regex ^-\{2,\}` => 592
  539. //for (let i = 0; i < output.length; i++) if (output[i] == 0x2D) output[i] = 0x2010;
  540. if (output[0] == HYPHEN) output[0] = UNICODE_HYPHEN;
  541. let end = output.length-1;
  542. if (output[end] == HYPHEN) output[end] = UNICODE_HYPHEN;
  543. */
  544. // 20230123: WHATWG URL uses "CheckHyphens" false
  545. // https://url.spec.whatwg.org/#idna
  546. // update ethereum symbol
  547. // ξ => Ξ if not greek
  548. if (type !== 'Greek') array_replace(output, 0x3BE, 0x39E);
  549. // 20221213: fixes bidi subdomain issue, but breaks invariant (200E is disallowed)
  550. // could be fixed with special case for: 2D (.) + 200E (LTR)
  551. // https://discuss.ens.domains/t/bidi-label-ordering-spoof/15824
  552. //output.splice(0, 0, 0x200E);
  553. }
  554. return flatten(labels);
  555. }
  556. function array_replace(v, a, b) {
  557. let prev = 0;
  558. while (true) {
  559. let next = v.indexOf(a, prev);
  560. if (next < 0) break;
  561. v[next] = b;
  562. prev = next + 1;
  563. }
  564. }
  565. function ens_split(name, preserve_emoji) {
  566. return split(name, nfc, preserve_emoji ? x => x.slice() : filter_fe0f); // emoji are exposed so copy
  567. }
  568. function split(name, nf, ef) {
  569. if (!name) return []; // 20230719: empty name allowance
  570. init();
  571. let offset = 0;
  572. // https://unicode.org/reports/tr46/#Validity_Criteria
  573. // 4.) "The label must not contain a U+002E ( . ) FULL STOP."
  574. return name.split(STOP_CH).map(label => {
  575. let input = explode_cp(label);
  576. let info = {
  577. input,
  578. offset, // codepoint, not substring!
  579. };
  580. offset += input.length + 1; // + stop
  581. try {
  582. // 1.) "The label must be in Unicode Normalization Form NFC"
  583. let tokens = info.tokens = tokens_from_str(input, nf, ef);
  584. let token_count = tokens.length;
  585. let type;
  586. if (!token_count) { // the label was effectively empty (could of had ignored characters)
  587. //norm = [];
  588. //type = 'None'; // use this instead of next match, "ASCII"
  589. // 20230120: change to strict
  590. // https://discuss.ens.domains/t/ens-name-normalization-2nd/14564/59
  591. throw new Error(`empty label`);
  592. }
  593. let norm = info.output = tokens.flat();
  594. check_leading_underscore(norm);
  595. let emoji = info.emoji = token_count > 1 || tokens[0].is_emoji; // same as: tokens.some(x => x.is_emoji);
  596. if (!emoji && norm.every(cp => cp < 0x80)) { // special case for ascii
  597. // 20230123: matches matches WHATWG, see note 3.3
  598. check_label_extension(norm); // only needed for ascii
  599. // cant have fenced
  600. // cant have cm
  601. // cant have wholes
  602. // see derive: "Fastpath ASCII"
  603. type = 'ASCII';
  604. } else {
  605. let chars = tokens.flatMap(x => x.is_emoji ? [] : x); // all of the nfc tokens concat together
  606. if (!chars.length) { // theres no text, just emoji
  607. type = 'Emoji';
  608. } else {
  609. // 5.) "The label must not begin with a combining mark, that is: General_Category=Mark."
  610. if (CM.has(norm[0])) throw error_placement('leading combining mark');
  611. for (let i = 1; i < token_count; i++) { // we've already checked the first token
  612. let cps = tokens[i];
  613. if (!cps.is_emoji && CM.has(cps[0])) { // every text token has emoji neighbors, eg. EtEEEtEt...
  614. // bidi_qq() not needed since emoji is LTR and cps is a CM
  615. throw error_placement(`emoji + combining mark: "${str_from_cps(tokens[i-1])} + ${safe_str_from_cps([cps[0]])}"`);
  616. }
  617. }
  618. check_fenced(norm);
  619. let unique = Array_from(new Set(chars));
  620. let [g] = determine_group(unique); // take the first match
  621. // see derive: "Matching Groups have Same CM Style"
  622. // alternative: could form a hybrid type: Latin/Japanese/...
  623. check_group(g, chars); // need text in order
  624. check_whole(g, unique); // only need unique text (order would be required for multiple-char confusables)
  625. type = g.N;
  626. // 20230121: consider exposing restricted flag
  627. // it's simpler to just check for 'Restricted'
  628. // or even better: type.endsWith(']')
  629. //if (g.R) info.restricted = true;
  630. }
  631. }
  632. info.type = type;
  633. } catch (err) {
  634. info.error = err; // use full error object
  635. }
  636. return info;
  637. });
  638. }
  639. function check_whole(group, unique) {
  640. let maker;
  641. let shared = [];
  642. for (let cp of unique) {
  643. let whole = WHOLE_MAP.get(cp);
  644. if (whole === UNIQUE_PH) return; // unique, non-confusable
  645. if (whole) {
  646. let set = whole.M.get(cp); // groups which have a character that look-like this character
  647. maker = maker ? maker.filter(g => set.has(g)) : Array_from(set);
  648. if (!maker.length) return; // confusable intersection is empty
  649. } else {
  650. shared.push(cp);
  651. }
  652. }
  653. if (maker) {
  654. // we have 1+ confusable
  655. // check if any of the remaining groups
  656. // contain the shared characters too
  657. for (let g of maker) {
  658. if (shared.every(cp => group_has_cp(g, cp))) {
  659. throw new Error(`whole-script confusable: ${group.N}/${g.N}`);
  660. }
  661. }
  662. }
  663. }
  664. // assumption: unique.size > 0
  665. // returns list of matching groups
  666. function determine_group(unique) {
  667. let groups = GROUPS;
  668. for (let cp of unique) {
  669. // note: we need to dodge CM that are whitelisted
  670. // but that code isn't currently necessary
  671. let gs = groups.filter(g => group_has_cp(g, cp));
  672. if (!gs.length) {
  673. if (!GROUPS.some(g => group_has_cp(g, cp))) {
  674. // the character was composed of valid parts
  675. // but it's NFC form is invalid
  676. // 20230716: change to more exact statement, see: ENSNormalize.{cs,java}
  677. // note: this doesn't have to be a composition
  678. // 20230720: change to full check
  679. throw error_disallowed(cp); // this should be rare
  680. } else {
  681. // there is no group that contains all these characters
  682. // throw using the highest priority group that matched
  683. // https://www.unicode.org/reports/tr39/#mixed_script_confusables
  684. throw error_group_member(groups[0], cp);
  685. }
  686. }
  687. groups = gs;
  688. if (gs.length == 1) break; // there is only one group left
  689. }
  690. // there are at least 1 group(s) with all of these characters
  691. return groups;
  692. }
  693. // throw on first error
  694. function flatten(split) {
  695. return split.map(({input, error, output}) => {
  696. if (error) {
  697. // don't print label again if just a single label
  698. let msg = error.message;
  699. // bidi_qq() only necessary if msg is digits
  700. throw new Error(split.length == 1 ? msg : `Invalid label ${bidi_qq(safe_str_from_cps(input, 63))}: ${msg}`);
  701. }
  702. return str_from_cps(output);
  703. }).join(STOP_CH);
  704. }
  705. function error_disallowed(cp) {
  706. // TODO: add cp to error?
  707. return new Error(`disallowed character: ${quoted_cp(cp)}`);
  708. }
  709. function error_group_member(g, cp) {
  710. let quoted = quoted_cp(cp);
  711. let gg = GROUPS.find(g => g.P.has(cp)); // only check primary
  712. if (gg) {
  713. quoted = `${gg.N} ${quoted}`;
  714. }
  715. return new Error(`illegal mixture: ${g.N} + ${quoted}`);
  716. }
  717. function error_placement(where) {
  718. return new Error(`illegal placement: ${where}`);
  719. }
  720. // assumption: cps.length > 0
  721. // assumption: cps[0] isn't a CM
  722. // assumption: the previous character isn't an emoji
  723. function check_group(g, cps) {
  724. for (let cp of cps) {
  725. if (!group_has_cp(g, cp)) {
  726. // for whitelisted scripts, this will throw illegal mixture on invalid cm, eg. "e{300}{300}"
  727. // at the moment, it's unnecessary to introduce an extra error type
  728. // until there exists a whitelisted multi-character
  729. // eg. if (M < 0 && is_combining_mark(cp)) { ... }
  730. // there are 3 cases:
  731. // 1. illegal cm for wrong group => mixture error
  732. // 2. illegal cm for same group => cm error
  733. // requires set of whitelist cm per group:
  734. // eg. new Set([...g.P, ...g.Q].flatMap(nfc).filter(cp => CM.has(cp)))
  735. // 3. wrong group => mixture error
  736. throw error_group_member(g, cp);
  737. }
  738. }
  739. //if (M >= 0) { // we have a known fixed cm count
  740. if (g.M) { // we need to check for NSM
  741. let decomposed = nfd(cps);
  742. for (let i = 1, e = decomposed.length; i < e; i++) { // see: assumption
  743. // 20230210: bugfix: using cps instead of decomposed h/t Carbon225
  744. /*
  745. if (CM.has(decomposed[i])) {
  746. let j = i + 1;
  747. while (j < e && CM.has(decomposed[j])) j++;
  748. if (j - i > M) {
  749. throw new Error(`too many combining marks: ${g.N} ${bidi_qq(str_from_cps(decomposed.slice(i-1, j)))} (${j-i}/${M})`);
  750. }
  751. i = j;
  752. }
  753. */
  754. // 20230217: switch to NSM counting
  755. // https://www.unicode.org/reports/tr39/#Optional_Detection
  756. if (NSM.has(decomposed[i])) {
  757. let j = i + 1;
  758. for (let cp; j < e && NSM.has(cp = decomposed[j]); j++) {
  759. // a. Forbid sequences of the same nonspacing mark.
  760. for (let k = i; k < j; k++) { // O(n^2) but n < 100
  761. if (decomposed[k] == cp) {
  762. throw new Error(`duplicate non-spacing marks: ${quoted_cp(cp)}`);
  763. }
  764. }
  765. }
  766. // parse to end so we have full nsm count
  767. // b. Forbid sequences of more than 4 nonspacing marks (gc=Mn or gc=Me).
  768. if (j - i > NSM_MAX) {
  769. // note: this slice starts with a base char or spacing-mark cm
  770. throw new Error(`excessive non-spacing marks: ${bidi_qq(safe_str_from_cps(decomposed.slice(i-1, j)))} (${j-i}/${NSM_MAX})`);
  771. }
  772. i = j;
  773. }
  774. }
  775. }
  776. // *** this code currently isn't needed ***
  777. /*
  778. let cm_whitelist = M instanceof Map;
  779. for (let i = 0, e = cps.length; i < e; ) {
  780. let cp = cps[i++];
  781. let seqs = cm_whitelist && M.get(cp);
  782. if (seqs) {
  783. // list of codepoints that can follow
  784. // if this exists, this will always be 1+
  785. let j = i;
  786. while (j < e && CM.has(cps[j])) j++;
  787. let cms = cps.slice(i, j);
  788. let match = seqs.find(seq => !compare_arrays(seq, cms));
  789. if (!match) throw new Error(`disallowed combining mark sequence: "${safe_str_from_cps([cp, ...cms])}"`);
  790. i = j;
  791. } else if (!V.has(cp)) {
  792. // https://www.unicode.org/reports/tr39/#mixed_script_confusables
  793. let quoted = quoted_cp(cp);
  794. for (let cp of cps) {
  795. let u = UNIQUE.get(cp);
  796. if (u && u !== g) {
  797. // if both scripts are restricted this error is confusing
  798. // because we don't differentiate RestrictedA from RestrictedB
  799. if (!u.R) quoted = `${quoted} is ${u.N}`;
  800. break;
  801. }
  802. }
  803. throw new Error(`disallowed ${g.N} character: ${quoted}`);
  804. //throw new Error(`disallowed character: ${quoted} (expected ${g.N})`);
  805. //throw new Error(`${g.N} does not allow: ${quoted}`);
  806. }
  807. }
  808. if (!cm_whitelist) {
  809. let decomposed = nfd(cps);
  810. for (let i = 1, e = decomposed.length; i < e; i++) { // we know it can't be cm leading
  811. if (CM.has(decomposed[i])) {
  812. let j = i + 1;
  813. while (j < e && CM.has(decomposed[j])) j++;
  814. if (j - i > M) {
  815. throw new Error(`too many combining marks: "${str_from_cps(decomposed.slice(i-1, j))}" (${j-i}/${M})`);
  816. }
  817. i = j;
  818. }
  819. }
  820. }
  821. */
  822. }
  823. // given a list of codepoints
  824. // returns a list of lists, where emoji are a fully-qualified (as Array subclass)
  825. // eg. explode_cp("abc💩d") => [[61, 62, 63], Emoji[1F4A9, FE0F], [64]]
  826. // 20230818: rename for 'process' name collision h/t Javarome
  827. // https://github.com/adraffy/ens-normalize.js/issues/23
  828. function tokens_from_str(input, nf, ef) {
  829. let ret = [];
  830. let chars = [];
  831. input = input.slice().reverse(); // flip so we can pop
  832. while (input.length) {
  833. let emoji = consume_emoji_reversed(input);
  834. if (emoji) {
  835. if (chars.length) {
  836. ret.push(nf(chars));
  837. chars = [];
  838. }
  839. ret.push(ef(emoji));
  840. } else {
  841. let cp = input.pop();
  842. if (VALID.has(cp)) {
  843. chars.push(cp);
  844. } else {
  845. let cps = MAPPED.get(cp);
  846. if (cps) {
  847. chars.push(...cps); // less than 10 elements
  848. } else if (!IGNORED.has(cp)) {
  849. // 20230912: unicode 15.1 changed the order of processing such that
  850. // disallowed parts are only rejected after NFC
  851. // https://unicode.org/reports/tr46/#Validity_Criteria
  852. // this doesn't impact normalization as of today
  853. // technically, this error can be removed as the group logic will apply similar logic
  854. // however the error type might be less clear
  855. throw error_disallowed(cp);
  856. }
  857. }
  858. }
  859. }
  860. if (chars.length) {
  861. ret.push(nf(chars));
  862. }
  863. return ret;
  864. }
  865. function filter_fe0f(cps) {
  866. return cps.filter(cp => cp != FE0F);
  867. }
  868. // given array of codepoints
  869. // returns the longest valid emoji sequence (or undefined if no match)
  870. // *MUTATES* the supplied array
  871. // disallows interleaved ignored characters
  872. // fills (optional) eaten array with matched codepoints
  873. function consume_emoji_reversed(cps, eaten) {
  874. let node = EMOJI_ROOT;
  875. let emoji;
  876. let pos = cps.length;
  877. while (pos) {
  878. node = node.get(cps[--pos]);
  879. if (!node) break;
  880. let {V} = node;
  881. if (V) { // this is a valid emoji (so far)
  882. emoji = V;
  883. if (eaten) eaten.push(...cps.slice(pos).reverse()); // (optional) copy input, used for ens_tokenize()
  884. cps.length = pos; // truncate
  885. }
  886. }
  887. return emoji;
  888. }
// ************************************************************
// tokenizer
// token type tags used as the "type" field of tokens produced by ens_tokenize()
const TY_VALID = 'valid'; // codepoint(s) found in VALID
const TY_MAPPED = 'mapped'; // codepoint with a replacement in MAPPED
const TY_IGNORED = 'ignored'; // codepoint found in IGNORED
const TY_DISALLOWED = 'disallowed'; // codepoint that is none of the above
const TY_EMOJI = 'emoji'; // matched emoji sequence
const TY_NFC = 'nfc'; // run of tokens that changed under NFC
const TY_STOP = 'stop'; // label separator
// break a name into descriptive tokens without throwing on invalid input
// name: string to tokenize
// options.nf: when true (default), adjacent text tokens whose codepoints change under NFC
//   are replaced by a single TY_NFC token
// returns an array of tokens, each with a "type" of TY_* and type-specific fields
function ens_tokenize(name, {
	nf = true, // collapse unnormalized runs into a single token
} = {}) {
	init();
	// reversed so the next codepoint can be popped from the end
	let input = explode_cp(name).reverse();
	let eaten = [];
	let tokens = [];
	// pass 1: classify every codepoint (or emoji sequence) into its own token
	while (input.length) {
		let emoji = consume_emoji_reversed(input, eaten);
		if (emoji) {
			tokens.push({
				type: TY_EMOJI,
				emoji: emoji.slice(), // copy emoji
				input: eaten,
				cps: filter_fe0f(emoji)
			});
			eaten = []; // reset buffer
		} else {
			let cp = input.pop();
			if (cp == STOP) {
				tokens.push({type: TY_STOP, cp});
			} else if (VALID.has(cp)) {
				tokens.push({type: TY_VALID, cps: [cp]});
			} else if (IGNORED.has(cp)) {
				tokens.push({type: TY_IGNORED, cp});
			} else {
				let cps = MAPPED.get(cp);
				if (cps) {
					tokens.push({type: TY_MAPPED, cp, cps: cps.slice()});
				} else {
					tokens.push({type: TY_DISALLOWED, cp});
				}
			}
		}
	}
	// pass 2: find runs of text that are altered by NFC and bundle each into one token
	if (nf) {
		// start: index of the most recent text token that did not require a check (or -1)
		// it becomes the first token of the slice when the following token requires a check
		for (let i = 0, start = -1; i < tokens.length; i++) {
			let token = tokens[i];
			if (is_valid_or_mapped(token.type)) {
				if (requires_check(token.cps)) { // normalization might be needed
					let end = i + 1;
					for (let pos = end; pos < tokens.length; pos++) { // find adjacent text
						let {type, cps} = tokens[pos];
						if (is_valid_or_mapped(type)) {
							if (!requires_check(cps)) break;
							end = pos + 1;
						} else if (type !== TY_IGNORED) { // || type !== TY_DISALLOWED) {
							break;
						}
					}
					if (start < 0) start = i;
					let slice = tokens.slice(start, end);
					let cps0 = slice.flatMap(x => is_valid_or_mapped(x.type) ? x.cps : []); // strip junk tokens
					let cps = nfc(cps0);
					if (compare_arrays(cps, cps0)) { // bundle into an nfc token
						tokens.splice(start, end - start, {
							type: TY_NFC,
							input: cps0, // there are 3 states: tokens0 ==(process)=> input ==(nfc)=> tokens/cps
							cps,
							tokens0: collapse_valid_tokens(slice),
							tokens: ens_tokenize(str_from_cps(cps), {nf: false})
						});
						i = start; // the slice is now a single token at index start
					} else {
						i = end - 1; // skip to end of slice
					}
					start = -1; // reset
				} else {
					start = i; // remember last
				}
			} else if (token.type !== TY_IGNORED) { // 20221024: is this correct?
				start = -1; // reset
			}
		}
	}
	return collapse_valid_tokens(tokens);
}
  975. function is_valid_or_mapped(type) {
  976. return type == TY_VALID || type == TY_MAPPED;
  977. }
  978. function requires_check(cps) {
  979. return cps.some(cp => NFC_CHECK.has(cp));
  980. }
  981. function collapse_valid_tokens(tokens) {
  982. for (let i = 0; i < tokens.length; i++) {
  983. if (tokens[i].type == TY_VALID) {
  984. let j = i + 1;
  985. while (j < tokens.length && tokens[j].type == TY_VALID) j++;
  986. tokens.splice(i, j - i, {type: TY_VALID, cps: tokens.slice(i, j).flatMap(x => x.cps)});
  987. }
  988. }
  989. return tokens;
  990. }
  991. export { ens_beautify, ens_emoji, ens_normalize, ens_normalize_fragment, ens_split, ens_tokenize, is_combining_mark, nfc, nfd, safe_str_from_cps, should_escape };