Skip to content

Commit 930339d

Browse files
committed
added more homoglyphs, brought java and js lib versions in sync
1 parent 5ba7fa4 commit 930339d

File tree

10 files changed

+197
-199
lines changed

10 files changed

+197
-199
lines changed

README.md

+1-1
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ Include the Homoglyph library in your project by downloading it from Maven Centr
88
<dependency>
99
<groupId>net.codebox</groupId>
1010
<artifactId>homoglyph</artifactId>
11-
<version>1.0.3</version>
11+
<version>1.1.0</version>
1212
</dependency>
1313
```
1414

build.gradle

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
group = "net.codebox"
2-
version = "1.0.3"
2+
version = "1.1.0"
33

44
apply plugin: 'java'
55
apply plugin: 'idea'

generator/source_data/confusables_extras.txt

+4-1
Original file line numberDiff line numberDiff line change
@@ -66,4 +66,7 @@ ff5d ; 7d ; MA # ( } → } )
6666
1D07 ; 45 ; MA # ( E → ᴇ )
6767
1D0A ; 4A ; MA # ( J → ᴊ )
6868
1D18 ; 50 ; MA # ( P → ᴘ )
69-
69+
1D1B ; 54 ; MA # ( T → ᴛ )
70+
03DC ; 46 ; MA # ( F → Ϝ )
71+
03DD ; 66 ; MA # ( f → ϝ )
72+
0030 ; 6F ; MA # ( o → 0 )

javascript/src/homoglyph.js

+61-61
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

javascript/tests/js/tests/DataTests.js

+61-61
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

node/index.js

+61-61
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

node/package.json

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
{
22
"name": "homoglyph-search",
3-
"version": "1.0.4",
3+
"version": "1.1.0",
44
"description": "A homoglyph-aware text search utility, allows you to search a string for a given word even if that word has been disguised using homoglyph characters",
55
"main": "index.js",
66
"engines" : {

raw_data/char_codes.txt

+3-6
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@
2121
2d,2d7,6d4,2010,2011,2012,2013,2043,2212,2796,2cba,fe58
2222
2e,660,6f0,701,702,2024,a4f8,a60e,ff0e,10a50,1d16d
2323
2f,1735,2041,2044,2215,2571,27cb,29f8,2cc6,2f03,3033,30ce,31d3,4e3f,ff0f,1d23a
24-
30,4f,39f,41e,555,7c0,9e6,b20,b66,12d0,2c9e,2d54,3007,a4f3,ff10,ff2f,10292,102ab,10404,104c2,10516,114d0,118b5,118e0,1d40e,1d442,1d476,1d4aa,1d4de,1d512,1d546,1d57a,1d5ae,1d5e2,1d616,1d64a,1d67e,1d6b6,1d6f0,1d72a,1d764,1d79e,1d7ce,1d7d8,1d7e2,1d7ec,1d7f6
24+
30,4f,6f,39f,3bf,3c3,41e,43e,555,585,5e1,647,665,6be,6c1,6d5,6f5,7c0,966,9e6,a66,ae6,b20,b66,be6,c02,c66,c82,ce6,d02,d20,d66,d82,e50,ed0,101d,1040,10ff,12d0,1d0f,1d11,2134,2c9e,2c9f,2d54,3007,a4f3,ab3d,fba6,fba7,fba8,fba9,fbaa,fbab,fbac,fbad,fee9,feea,feeb,feec,ff10,ff2f,ff4f,10292,102ab,10404,1042c,104c2,104ea,10516,114d0,118b5,118c8,118d7,118e0,1d40e,1d428,1d442,1d45c,1d476,1d490,1d4aa,1d4de,1d4f8,1d512,1d52c,1d546,1d560,1d57a,1d594,1d5ae,1d5c8,1d5e2,1d5fc,1d616,1d630,1d64a,1d664,1d67e,1d698,1d6b6,1d6d0,1d6d4,1d6f0,1d70a,1d70e,1d72a,1d744,1d748,1d764,1d77e,1d782,1d79e,1d7b8,1d7bc,1d7ce,1d7d8,1d7e2,1d7ec,1d7f6,1ee24,1ee64,1ee84
2525
31,49,6c,7c,196,1c0,399,406,4c0,5c0,5d5,5df,627,661,6f1,7ca,16c1,2110,2111,2113,2160,217c,2223,23fd,2c92,2d4f,a4f2,fe8d,fe8e,ff11,ff29,ff4c,ffe8,1028a,10309,10320,16f28,1d408,1d425,1d43c,1d459,1d470,1d48d,1d4c1,1d4d8,1d4f5,1d529,1d540,1d55d,1d574,1d591,1d5a8,1d5c5,1d5dc,1d5f9,1d610,1d62d,1d644,1d661,1d678,1d695,1d6b0,1d6ea,1d724,1d75e,1d798,1d7cf,1d7d9,1d7e3,1d7ed,1d7f7,1e8c7,1ee00,1ee80
2626
32,1a7,3e8,14bf,a644,a6ef,a75a,ff12,1d7d0,1d7da,1d7e4,1d7ee,1d7f8
2727
33,1b7,21c,417,4e0,2ccc,a76a,a7ab,ff13,118ca,16f3b,1d206,1d7d1,1d7db,1d7e5,1d7ef,1d7f9
@@ -55,7 +55,7 @@
5555
51,211a,2d55,ff31,1d410,1d444,1d478,1d4ac,1d4e0,1d514,1d57c,1d5b0,1d5e4,1d618,1d64c,1d680
5656
52,1a6,280,13a1,13d2,1587,16b1,211b,211c,211d,a4e3,ab71,aba2,ff32,104b4,16f35,1d216,1d411,1d445,1d479,1d4e1,1d57d,1d5b1,1d5e5,1d619,1d64d,1d681
5757
53,405,54f,13d5,13da,a4e2,ff33,10296,10420,16f3a,1d412,1d446,1d47a,1d4ae,1d4e2,1d516,1d54a,1d57e,1d5b2,1d5e6,1d61a,1d64e,1d682
58-
54,3a4,422,13a2,22a4,27d9,2ca6,a4d4,ff34,10297,102b1,10315,118bc,16f0a,1d413,1d447,1d47b,1d4af,1d4e3,1d517,1d54b,1d57f,1d5b3,1d5e7,1d61b,1d64f,1d683,1d6bb,1d6f5,1d72f,1d769,1d7a3,1f768
58+
54,3a4,3c4,422,442,13a2,1d1b,22a4,27d9,2ca6,a4d4,ab72,ff34,10297,102b1,10315,118bc,16f0a,1d413,1d447,1d47b,1d4af,1d4e3,1d517,1d54b,1d57f,1d5b3,1d5e7,1d61b,1d64f,1d683,1d6bb,1d6d5,1d6f5,1d70f,1d72f,1d749,1d769,1d783,1d7a3,1d7bd,1f768
5959
55,54d,1200,144c,222a,22c3,a4f4,ff35,104ce,118b8,16f42,1d414,1d448,1d47c,1d4b0,1d4e4,1d518,1d54c,1d580,1d5b4,1d5e8,1d61c,1d650,1d684
6060
56,474,667,6f7,13d9,142f,2164,2d38,a4e6,a6df,ff36,1051d,118a0,16f08,1d20d,1d415,1d449,1d47d,1d4b1,1d4e5,1d519,1d54d,1d581,1d5b5,1d5e9,1d61d,1d651,1d685
6161
57,51c,13b3,13d4,a4ea,ff37,118e6,118ef,1d416,1d44a,1d47e,1d4b2,1d4e6,1d51a,1d54e,1d582,1d5b6,1d5ea,1d61e,1d652,1d686
@@ -70,15 +70,14 @@
7070
63,3f2,441,1d04,217d,2ca5,abaf,ff43,1043d,1d41c,1d450,1d484,1d4b8,1d4ec,1d520,1d554,1d588,1d5bc,1d5f0,1d624,1d658,1d68c
7171
64,501,13e7,146f,2146,217e,a4d2,ff44,1d41d,1d451,1d485,1d4b9,1d4ed,1d521,1d555,1d589,1d5bd,1d5f1,1d625,1d659,1d68d
7272
65,435,4bd,212e,212f,2147,ab32,ff45,1d41e,1d452,1d486,1d4ee,1d522,1d556,1d58a,1d5be,1d5f2,1d626,1d65a,1d68e
73-
66,17f,584,1e9d,a799,ab35,ff46,1d41f,1d453,1d487,1d4bb,1d4ef,1d523,1d557,1d58b,1d5bf,1d5f3,1d627,1d65b,1d68f
73+
66,17f,3dd,584,1e9d,a799,ab35,ff46,1d41f,1d453,1d487,1d4bb,1d4ef,1d523,1d557,1d58b,1d5bf,1d5f3,1d627,1d65b,1d68f,1d7cb
7474
67,18d,261,581,1d83,210a,ff47,1d420,1d454,1d488,1d4f0,1d524,1d558,1d58c,1d5c0,1d5f4,1d628,1d65c,1d690
7575
68,4bb,570,13c2,210e,ff48,1d421,1d489,1d4bd,1d4f1,1d525,1d559,1d58d,1d5c1,1d5f5,1d629,1d65d,1d691
7676
69,131,269,26a,2db,37a,3b9,456,4cf,13a5,1fbe,2139,2148,2170,2373,a647,ab75,ff49,118c3,1d422,1d456,1d48a,1d4be,1d4f2,1d526,1d55a,1d58e,1d5c2,1d5f6,1d62a,1d65e,1d692,1d6a4,1d6ca,1d704,1d73e,1d778,1d7b2
7777
6a,3f3,458,2149,ff4a,1d423,1d457,1d48b,1d4bf,1d4f3,1d527,1d55b,1d58f,1d5c3,1d5f7,1d62b,1d65f,1d693
7878
6b,ff4b,1d424,1d458,1d48c,1d4c0,1d4f4,1d528,1d55c,1d590,1d5c4,1d5f8,1d62c,1d660,1d694
7979
6d,ff4d
8080
6e,578,57c,ff4e,1d427,1d45b,1d48f,1d4c3,1d4f7,1d52b,1d55f,1d593,1d5c7,1d5fb,1d62f,1d663,1d697
81-
6f,3bf,3c3,43e,585,5e1,647,665,6be,6c1,6d5,6f5,966,a66,ae6,be6,c02,c66,c82,ce6,d02,d20,d66,d82,e50,ed0,101d,1040,10ff,1d0f,1d11,2134,2c9f,ab3d,fba6,fba7,fba8,fba9,fbaa,fbab,fbac,fbad,fee9,feea,feeb,feec,ff4f,1042c,104ea,118c8,118d7,1d428,1d45c,1d490,1d4f8,1d52c,1d560,1d594,1d5c8,1d5fc,1d630,1d664,1d698,1d6d0,1d6d4,1d70a,1d70e,1d744,1d748,1d77e,1d782,1d7b8,1d7bc,1ee24,1ee64,1ee84
8281
70,3c1,3f1,440,2374,2ca3,ff50,1d429,1d45d,1d491,1d4c5,1d4f9,1d52d,1d561,1d595,1d5c9,1d5fd,1d631,1d665,1d699,1d6d2,1d6e0,1d70c,1d71a,1d746,1d754,1d780,1d78e,1d7ba,1d7c8
8382
71,51b,563,566,ff51,1d42a,1d45e,1d492,1d4c6,1d4fa,1d52e,1d562,1d596,1d5ca,1d5fe,1d632,1d666,1d69a
8483
72,433,1d26,2c85,ab47,ab48,ab81,ff52,1d42b,1d45f,1d493,1d4c7,1d4fb,1d52f,1d563,1d597,1d5cb,1d5ff,1d633,1d667,1d69b
@@ -225,13 +224,11 @@ fe,1bf,3f8
225224
3be,1d6cf,1d709,1d743,1d77d,1d7b7
226225
3c0,3d6,43f,1d28,213c,1d6d1,1d6e1,1d70b,1d71b,1d745,1d755,1d77f,1d78f,1d7b9,1d7c9
227226
3c2,3db,1d6d3,1d70d,1d747,1d781,1d7bb
228-
3c4,442,1d1b,ab72,1d6d5,1d70f,1d749,1d783,1d7bd
229227
3c7,2cad,ab53,ab55,1d6d8,1d712,1d74c,1d786,1d7c0
230228
3c8,471,104f9,1d6d9,1d713,1d74d,1d787,1d7c1
231229
3c9,2375,2cb1,a64d,a7b7,1d6da,1d714,1d74e,1d788,1d7c2
232230
3d7,2ce4
233231
3d8,102ad,10312
234-
3dd,1d7cb
235232
3ec,2cdc
236233
3ff,a73e
237234
404,20ac,2c88,a792

raw_data/chars.txt

+3-6
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@ $$
2020
-˗۔‐‑‒–⁃−➖Ⲻ﹘
2121
.٠۰܁܂․ꓸ꘎.𐩐𝅭
2222
/᜵⁁⁄∕╱⟋⧸Ⳇ⼃〳ノ㇓丿/𝈺
23-
0OΟОՕ߀০ଠ୦ዐⲞⵔ〇ꓳ0O𐊒𐊫𐐄𐓂𐔖𑓐𑢵𑣠𝐎𝑂𝑶𝒪𝓞𝔒𝕆𝕺𝖮𝗢𝘖𝙊𝙾𝚶𝛰𝜪𝝤𝞞𝟎𝟘𝟢𝟬𝟶
23+
0OoΟοσОоՕօסه٥ھہە۵߀०০੦૦ଠ୦௦ం౦ಂ೦ംഠ൦ං๐໐ဝ၀ჿዐᴏᴑℴⲞⲟⵔ〇ꓳꬽﮦﮧﮨﮩﮪﮫﮬﮭﻩﻪﻫﻬ0Oo𐊒𐊫𐐄𐐬𐓂𐓪𐔖𑓐𑢵𑣈𑣗𑣠𝐎𝐨𝑂𝑜𝑶𝒐𝒪𝓞𝓸𝔒𝔬𝕆𝕠𝕺𝖔𝖮𝗈𝗢𝗼𝘖𝘰𝙊𝙤𝙾𝚘𝚶𝛐𝛔𝛰𝜊𝜎𝜪𝝄𝝈𝝤𝝾𝞂𝞞𝞸𝞼𝟎𝟘𝟢𝟬𝟶𞸤𞹤𞺄
2424
1Il|ƖǀΙІӀ׀וןا١۱ߊᛁℐℑℓⅠⅼ∣⏽Ⲓⵏꓲﺍﺎ1Il│𐊊𐌉𐌠𖼨𝐈𝐥𝐼𝑙𝑰𝒍𝓁𝓘𝓵𝔩𝕀𝕝𝕴𝖑𝖨𝗅𝗜𝗹𝘐𝘭𝙄𝙡𝙸𝚕𝚰𝛪𝜤𝝞𝞘𝟏𝟙𝟣𝟭𝟷𞣇𞸀𞺀
2525
2ƧϨᒿꙄꛯꝚ2𝟐𝟚𝟤𝟮𝟸
2626
3ƷȜЗӠⳌꝪꞫ3𑣊𖼻𝈆𝟑𝟛𝟥𝟯𝟹
@@ -54,7 +54,7 @@ PΡРᏢᑭᴘᴩℙⲢꓑꮲP𐊕𝐏𝑃𝑷𝒫𝓟𝔓𝕻𝖯𝗣𝘗𝙋
5454
QℚⵕQ𝐐𝑄𝑸𝒬𝓠𝔔𝕼𝖰𝗤𝘘𝙌𝚀
5555
RƦʀᎡᏒᖇᚱℛℜℝꓣꭱꮢR𐒴𖼵𝈖𝐑𝑅𝑹𝓡𝕽𝖱𝗥𝘙𝙍𝚁
5656
SЅՏᏕᏚꓢS𐊖𐐠𖼺𝐒𝑆𝑺𝒮𝓢𝔖𝕊𝕾𝖲𝗦𝘚𝙎𝚂
57-
TΤТᎢ⊤⟙ⲦꓔT𐊗𐊱𐌕𑢼𖼊𝐓𝑇𝑻𝒯𝓣𝔗𝕋𝕿𝖳𝗧𝘛𝙏𝚃𝚻𝛵𝜯𝝩𝞣🝨
57+
TΤτТтᎢᴛ⊤⟙ⲦꓔꭲT𐊗𐊱𐌕𑢼𖼊𝐓𝑇𝑻𝒯𝓣𝔗𝕋𝕿𝖳𝗧𝘛𝙏𝚃𝚻𝛕𝛵𝜏𝜯𝝉𝝩𝞃𝞣𝞽🝨
5858
UՍሀᑌ∪⋃ꓴU𐓎𑢸𖽂𝐔𝑈𝑼𝒰𝓤𝔘𝕌𝖀𝖴𝗨𝘜𝙐𝚄
5959
VѴ٧۷ᏙᐯⅤⴸꓦꛟV𐔝𑢠𖼈𝈍𝐕𝑉𝑽𝒱𝓥𝔙𝕍𝖁𝖵𝗩𝘝𝙑𝚅
6060
WԜᎳᏔꓪW𑣦𑣯𝐖𝑊𝑾𝒲𝓦𝔚𝕎𝖂𝖶𝗪𝘞𝙒𝚆
@@ -69,15 +69,14 @@ bƄЬᏏᖯb𝐛𝑏𝒃𝒷𝓫𝔟𝕓𝖇𝖻𝗯𝘣𝙗𝚋
6969
cϲсᴄⅽⲥꮯc𐐽𝐜𝑐𝒄𝒸𝓬𝔠𝕔𝖈𝖼𝗰𝘤𝙘𝚌
7070
dԁᏧᑯⅆⅾꓒd𝐝𝑑𝒅𝒹𝓭𝔡𝕕𝖉𝖽𝗱𝘥𝙙𝚍
7171
eеҽ℮ℯⅇꬲe𝐞𝑒𝒆𝓮𝔢𝕖𝖊𝖾𝗲𝘦𝙚𝚎
72-
fſքẝꞙꬵf𝐟𝑓𝒇𝒻𝓯𝔣𝕗𝖋𝖿𝗳𝘧𝙛𝚏
72+
fſϝքẝꞙꬵf𝐟𝑓𝒇𝒻𝓯𝔣𝕗𝖋𝖿𝗳𝘧𝙛𝚏𝟋
7373
gƍɡցᶃℊg𝐠𝑔𝒈𝓰𝔤𝕘𝖌𝗀𝗴𝘨𝙜𝚐
7474
hһհᏂℎh𝐡𝒉𝒽𝓱𝔥𝕙𝖍𝗁𝗵𝘩𝙝𝚑
7575
iıɩɪ˛ͺιіӏᎥιℹⅈⅰ⍳ꙇꭵi𑣃𝐢𝑖𝒊𝒾𝓲𝔦𝕚𝖎𝗂𝗶𝘪𝙞𝚒𝚤𝛊𝜄𝜾𝝸𝞲
7676
jϳјⅉj𝐣𝑗𝒋𝒿𝓳𝔧𝕛𝖏𝗃𝗷𝘫𝙟𝚓
7777
kk𝐤𝑘𝒌𝓀𝓴𝔨𝕜𝖐𝗄𝗸𝘬𝙠𝚔
7878
mm
7979
nոռn𝐧𝑛𝒏𝓃𝓷𝔫𝕟𝖓𝗇𝗻𝘯𝙣𝚗
80-
oοσоօסه٥ھہە۵०੦૦௦ం౦ಂ೦ംഠ൦ං๐໐ဝ၀ჿᴏᴑℴⲟꬽﮦﮧﮨﮩﮪﮫﮬﮭﻩﻪﻫﻬo𐐬𐓪𑣈𑣗𝐨𝑜𝒐𝓸𝔬𝕠𝖔𝗈𝗼𝘰𝙤𝚘𝛐𝛔𝜊𝜎𝝄𝝈𝝾𝞂𝞸𝞼𞸤𞹤𞺄
8180
pρϱр⍴ⲣp𝐩𝑝𝒑𝓅𝓹𝔭𝕡𝖕𝗉𝗽𝘱𝙥𝚙𝛒𝛠𝜌𝜚𝝆𝝔𝞀𝞎𝞺𝟈
8281
qԛգզq𝐪𝑞𝒒𝓆𝓺𝔮𝕢𝖖𝗊𝗾𝘲𝙦𝚚
8382
rгᴦⲅꭇꭈꮁr𝐫𝑟𝒓𝓇𝓻𝔯𝕣𝖗𝗋𝗿𝘳𝙧𝚛
@@ -224,13 +223,11 @@ zᴢꮓz𑣄𝐳𝑧𝒛𝓏𝔃𝔷𝕫𝖟𝗓𝘇𝘻𝙯𝚣
224223
ξ𝛏𝜉𝝃𝝽𝞷
225224
πϖпᴨℼ𝛑𝛡𝜋𝜛𝝅𝝕𝝿𝞏𝞹𝟉
226225
ςϛ𝛓𝜍𝝇𝞁𝞻
227-
τтᴛꭲ𝛕𝜏𝝉𝞃𝞽
228226
χⲭꭓꭕ𝛘𝜒𝝌𝞆𝟀
229227
ψѱ𐓹𝛙𝜓𝝍𝞇𝟁
230228
ω⍵ⲱꙍꞷ𝛚𝜔𝝎𝞈𝟂
231229
ϗⳤ
232230
Ϙ𐊭𐌒
233-
ϝ𝟋
234231
ϬⳜ
235232
ϿꜾ
236233
Є€ⲈꞒ

src/test/java/net/codebox/homoglyph/HomoglyphDataTest.java

+1
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,7 @@ public void setup() throws IOException {
2222
@Test
2323
public void testLowerCase(){
2424
check("free ϲгеԁıt!", "credit");
25+
check("free ϲrEd1ᴛ", "credit");
2526
check("see best w℮Ꮟc⍺ms here", "webcams");
2627
check("get blue pɪ|ǀs", "pills");
2728
check("саsℎ prizes!!", "cash");

0 commit comments

Comments
 (0)