remove_diacritics

PHOTO EMBED

Sun Dec 25 2022 15:52:08 GMT+0000 (Coordinated Universal Time)

Saved by @abdalrahmansh #python #kaggle #nlp #arabicnlp #unicode

def remove_diacritics(text : str) -> str:
    """Return ``text`` with every character contained in ``HARAKAT`` removed.

    Characters are examined one at a time, in order; any character that is
    a member of the externally defined ``HARAKAT`` collection is dropped and
    all remaining characters are concatenated unchanged.

    Example (assuming ``HARAKAT`` holds the Arabic diacritic marks --
    the constant is not defined in this block, confirm against its
    definition):

        input  : "أَهْلًا وسَهْلًا Hello 212"
        output : "أهلا وسهلا Hello 212"
    """
    kept = []
    for symbol in text:
        # Skip anything listed in HARAKAT; everything else passes through.
        if symbol in HARAKAT:
            continue
        kept.append(symbol)
    return ''.join(kept)
content_copyCOPY