Skip to content

Commit 61f9144

Browse files
committed
Add two more old characters in normalize_unicode
1 parent 231985b commit 61f9144

1 file changed

Lines changed: 2 additions & 0 deletions

File tree

botok/utils/unicode_normalization.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -113,6 +113,7 @@ def normalize_unicode(s, form="nfd"):
113 113
s = s.replace("\u0f81", "\u0f71\u0f80") # use is discouraged
114 114
if form == "nfd":
115 115
s = s.replace("\u0f43", "\u0f42\u0fb7")
116+
s = s.replace("\u0f48", "\u0f47\u0fb7")
116 117
s = s.replace("\u0f4d", "\u0f4c\u0fb7")
117 118
s = s.replace("\u0f52", "\u0f51\u0fb7")
118 119
s = s.replace("\u0f57", "\u0f56\u0fb7")
@@ -121,6 +122,7 @@ def normalize_unicode(s, form="nfd"):
121 122
s = s.replace("\u0f76", "\u0fb2\u0f80")
122 123
s = s.replace("\u0f78", "\u0fb3\u0f80")
123 124
s = s.replace("\u0f93", "\u0f92\u0fb7")
125+
s = s.replace("\u0f98", "\u0f97\u0fb7")
124 126
s = s.replace("\u0f9d", "\u0f9c\u0fb7")
125 127
s = s.replace("\u0fa2", "\u0fa1\u0fb7")
126 128
s = s.replace("\u0fa7", "\u0fa6\u0fb7")

0 commit comments

Comments
 (0)