You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
# Check whether the character is in anltk.constants.HARAKAT
anltk.is_tashkeel('ي')  # False
anltk.is_tashkeel('ِ')  # True
# Check whether the character is in anltk.constants.ALPHABET
anltk.is_arabic_alpha('h')  # False
anltk.is_arabic_alpha('أ')  # True
# Check whether a character is shamsi
anltk.is_shamsi('ش')
# True
# Check whether a character is qamari
anltk.is_qamari('و')
# True
Preprocessing:
anltk.remove_tashkeel('فرَاشَةٌ مُلَوَّنَةٌ تَطِيْرُ في البُسْتَانِ')
# 'فراشة ملونة تطير في البستان'
# stop_list is the list of characters that won't be removed
anltk.remove_non_alpha('فرَاdشَةٌ مُلَوَّنَ3ةٌ!', stop_list='! ')
# 'فراشة ملونة!'
anltk.remove_non_alphanumeric('فرَاdشَةٌ مُلَوَّ3نَةٌ!', stop_list='! ')
# 'فراشة ملو3نة!'
anltk.remove_non_alphanumeric_and_tashkeel('فرَاdشَةٌ مُلَوَّ3نَةٌ!', stop_list='! ')
# 'فرَاشَةٌ مُلَوَّ3نَةٌ!'
anltk.remove_kasheeda('بســــم الـــله')
# 'بسم الله'
# Replaces the Hamza forms ء, آ, ؤ, ئ with أ
anltk.normalize_hamzat('اللآلئ')
# 'اللألأ'