diff options
| author | 2018-11-20 12:00:47 +0000 | |
|---|---|---|
| committer | 2018-11-20 12:00:47 +0000 | |
| commit | 52d5b5da496a9e8bbc2b3098ad943a6b635c3647 (patch) | |
| tree | 1968c1ff6e5746223d2f0dfd4eb8dbed2f70e16d /modules | |
| parent | Detect Armenian script (mixed_unicode.py) (diff) | |
| signature | ||
Detect full-width characters (mixed_unicode.py)
Diffstat (limited to 'modules')
| -rw-r--r-- | modules/mixed_unicode.py | 11 |
1 file changed, 7 insertions, 4 deletions
diff --git a/modules/mixed_unicode.py b/modules/mixed_unicode.py index 9bb9060d..ff5ccf41 100644 --- a/modules/mixed_unicode.py +++ b/modules/mixed_unicode.py @@ -7,19 +7,22 @@ class Script(enum.Enum): Cyrillic = 2 Greek = 3 Armenian = 4 + FullWidth = 5 WORD_SEPERATORS = [",", " ", "\t", "."] class Module(ModuleManager.BaseModule): def _detect_script(self, char): point = ord(char) - if 0 <= point <= 687: + if 0 <= point <= 687: return Script.Latin - elif 880 <= point <= 1023: + elif 880 <= point <= 1023: return Script.Greek - elif 1024 <= point <= 1327: + elif 1024 <= point <= 1327: return Script.Cyrillic - elif 1329 <= point <= 1418: + elif 1329 <= point <= 1418: return Script.Armenian + elif 65281 <= point <= 65376: + return Script.FullWidth return Script.Unknown @utils.hook("received.message.channel") |
