使用 unicodedata 对字符进行规范化(normalize)对西里尔字母不起作用。
如何将外形与拉丁字母相同的西里尔字母转换为对应的拉丁字符?
import unicodedata
# Cyrillic letters that are visually identical to Latin letters are separate
# code points with NO Unicode decomposition, so NFKD normalization leaves them
# untouched and a subsequent ASCII encode with 'ignore' silently drops them.
# They have to be mapped explicitly. Escapes are used on purpose: the glyphs
# are indistinguishable from their Latin twins in most fonts.
HOMOGLYPHS = str.maketrans(
    # А В Е К М Н О Р С Т У Х  (upper case)
    '\u0410\u0412\u0415\u041a\u041c\u041d\u041e\u0420\u0421\u0422\u0423\u0425'
    # а е о р с у х  (lower case)
    '\u0430\u0435\u043e\u0440\u0441\u0443\u0445',
    'ABEKMHOPCTYX'
    'aeopcyx',
)


def to_latin(text: str) -> str:
    """Return *text* reduced to ASCII, mapping Cyrillic look-alikes to Latin.

    The text is NFKD-normalized first (so accented Latin letters lose their
    diacritics), then Cyrillic homoglyphs are replaced by the Latin letters
    they resemble, and finally anything still outside ASCII is dropped.

    This is a homoglyph mapping, not a transliteration: Cyrillic letters
    without a Latin look-alike (e.g. U+0416) are still removed.
    """
    decomposed = unicodedata.normalize('NFKD', text)
    latinized = decomposed.translate(HOMOGLYPHS)
    # 'ignore' discards combining marks left over from the decomposition and
    # any character that has no ASCII equivalent.
    return latinized.encode('ascii', 'ignore').decode('ascii')


cyrillic = 'НОMЕ СHEF'
ordinary = 'HOME CHEF'
string = to_latin(cyrillic)
print(string == ordinary)
# prints True
print(string)
# prints HOME CHEF