You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
ORPA-pyOpenRPA/Resources/WPy64-3720/python-3.7.2.amd64/Lib/site-packages/snowballstemmer/hindi_stemmer.py

198 lines
8.0 KiB

# Generated by Snowball 2.0.0 - https://snowballstem.org/
from .basestemmer import BaseStemmer
from .among import Among
class HindiStemmer(BaseStemmer):
'''
This class implements the stemming algorithm defined by a snowball script.
Generated by Snowball 2.0.0 - https://snowballstem.org/
'''
a_0 = [
Among(u"\u0906\u0901", -1, -1),
Among(u"\u093E\u0901", -1, -1),
Among(u"\u0907\u092F\u093E\u0901", 1, -1),
Among(u"\u0906\u0907\u092F\u093E\u0901", 2, -1),
Among(u"\u093E\u0907\u092F\u093E\u0901", 2, -1),
Among(u"\u093F\u092F\u093E\u0901", 1, -1),
Among(u"\u0906\u0902", -1, -1),
Among(u"\u0909\u0906\u0902", 6, -1),
Among(u"\u0941\u0906\u0902", 6, -1),
Among(u"\u0908\u0902", -1, -1),
Among(u"\u0906\u0908\u0902", 9, -1),
Among(u"\u093E\u0908\u0902", 9, -1),
Among(u"\u090F\u0902", -1, -1),
Among(u"\u0906\u090F\u0902", 12, -1),
Among(u"\u0909\u090F\u0902", 12, -1),
Among(u"\u093E\u090F\u0902", 12, -1),
Among(u"\u0924\u093E\u090F\u0902", 15, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0924\u093E\u090F\u0902", 16, -1),
Among(u"\u0928\u093E\u090F\u0902", 15, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0928\u093E\u090F\u0902", 18, -1),
Among(u"\u0941\u090F\u0902", 12, -1),
Among(u"\u0913\u0902", -1, -1),
Among(u"\u0906\u0913\u0902", 21, -1),
Among(u"\u0909\u0913\u0902", 21, -1),
Among(u"\u093E\u0913\u0902", 21, -1),
Among(u"\u0924\u093E\u0913\u0902", 24, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0924\u093E\u0913\u0902", 25, -1),
Among(u"\u0928\u093E\u0913\u0902", 24, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0928\u093E\u0913\u0902", 27, -1),
Among(u"\u0941\u0913\u0902", 21, -1),
Among(u"\u093E\u0902", -1, -1),
Among(u"\u0907\u092F\u093E\u0902", 30, -1),
Among(u"\u0906\u0907\u092F\u093E\u0902", 31, -1),
Among(u"\u093E\u0907\u092F\u093E\u0902", 31, -1),
Among(u"\u093F\u092F\u093E\u0902", 30, -1),
Among(u"\u0940\u0902", -1, -1),
Among(u"\u0924\u0940\u0902", 35, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0924\u0940\u0902", 36, -1),
Among(u"\u0906\u0924\u0940\u0902", 36, -1),
Among(u"\u093E\u0924\u0940\u0902", 36, -1),
Among(u"\u0947\u0902", -1, -1),
Among(u"\u094B\u0902", -1, -1),
Among(u"\u0907\u092F\u094B\u0902", 41, -1),
Among(u"\u0906\u0907\u092F\u094B\u0902", 42, -1),
Among(u"\u093E\u0907\u092F\u094B\u0902", 42, -1),
Among(u"\u093F\u092F\u094B\u0902", 41, -1),
Among(u"\u0905", -1, -1),
Among(u"\u0906", -1, -1),
Among(u"\u0907", -1, -1),
Among(u"\u0908", -1, -1),
Among(u"\u0906\u0908", 49, -1),
Among(u"\u093E\u0908", 49, -1),
Among(u"\u0909", -1, -1),
Among(u"\u090A", -1, -1),
Among(u"\u090F", -1, -1),
Among(u"\u0906\u090F", 54, -1),
Among(u"\u0907\u090F", 54, -1),
Among(u"\u0906\u0907\u090F", 56, -1),
Among(u"\u093E\u0907\u090F", 56, -1),
Among(u"\u093E\u090F", 54, -1),
Among(u"\u093F\u090F", 54, -1),
Among(u"\u0913", -1, -1),
Among(u"\u0906\u0913", 61, -1),
Among(u"\u093E\u0913", 61, -1),
Among(u"\u0915\u0930", -1, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0915\u0930", 64, -1),
Among(u"\u0906\u0915\u0930", 64, -1),
Among(u"\u093E\u0915\u0930", 64, -1),
Among(u"\u093E", -1, -1),
Among(u"\u090A\u0902\u0917\u093E", 68, -1),
Among(u"\u0906\u090A\u0902\u0917\u093E", 69, -1),
Among(u"\u093E\u090A\u0902\u0917\u093E", 69, -1),
Among(u"\u0942\u0902\u0917\u093E", 68, -1),
Among(u"\u090F\u0917\u093E", 68, -1),
Among(u"\u0906\u090F\u0917\u093E", 73, -1),
Among(u"\u093E\u090F\u0917\u093E", 73, -1),
Among(u"\u0947\u0917\u093E", 68, -1),
Among(u"\u0924\u093E", 68, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0924\u093E", 77, -1),
Among(u"\u0906\u0924\u093E", 77, -1),
Among(u"\u093E\u0924\u093E", 77, -1),
Among(u"\u0928\u093E", 68, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0928\u093E", 81, -1),
Among(u"\u0906\u0928\u093E", 81, -1),
Among(u"\u093E\u0928\u093E", 81, -1),
Among(u"\u0906\u092F\u093E", 68, -1),
Among(u"\u093E\u092F\u093E", 68, -1),
Among(u"\u093F", -1, -1),
Among(u"\u0940", -1, -1),
Among(u"\u090A\u0902\u0917\u0940", 88, -1),
Among(u"\u0906\u090A\u0902\u0917\u0940", 89, -1),
Among(u"\u093E\u090A\u0902\u0917\u0940", 89, -1),
Among(u"\u090F\u0902\u0917\u0940", 88, -1),
Among(u"\u0906\u090F\u0902\u0917\u0940", 92, -1),
Among(u"\u093E\u090F\u0902\u0917\u0940", 92, -1),
Among(u"\u0942\u0902\u0917\u0940", 88, -1),
Among(u"\u0947\u0902\u0917\u0940", 88, -1),
Among(u"\u090F\u0917\u0940", 88, -1),
Among(u"\u0906\u090F\u0917\u0940", 97, -1),
Among(u"\u093E\u090F\u0917\u0940", 97, -1),
Among(u"\u0913\u0917\u0940", 88, -1),
Among(u"\u0906\u0913\u0917\u0940", 100, -1),
Among(u"\u093E\u0913\u0917\u0940", 100, -1),
Among(u"\u0947\u0917\u0940", 88, -1),
Among(u"\u094B\u0917\u0940", 88, -1),
Among(u"\u0924\u0940", 88, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0924\u0940", 105, -1),
Among(u"\u0906\u0924\u0940", 105, -1),
Among(u"\u093E\u0924\u0940", 105, -1),
Among(u"\u0928\u0940", 88, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0928\u0940", 109, -1),
Among(u"\u0941", -1, -1),
Among(u"\u0942", -1, -1),
Among(u"\u0947", -1, -1),
Among(u"\u090F\u0902\u0917\u0947", 113, -1),
Among(u"\u0906\u090F\u0902\u0917\u0947", 114, -1),
Among(u"\u093E\u090F\u0902\u0917\u0947", 114, -1),
Among(u"\u0947\u0902\u0917\u0947", 113, -1),
Among(u"\u0913\u0917\u0947", 113, -1),
Among(u"\u0906\u0913\u0917\u0947", 118, -1),
Among(u"\u093E\u0913\u0917\u0947", 118, -1),
Among(u"\u094B\u0917\u0947", 113, -1),
Among(u"\u0924\u0947", 113, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0924\u0947", 122, -1),
Among(u"\u0906\u0924\u0947", 122, -1),
Among(u"\u093E\u0924\u0947", 122, -1),
Among(u"\u0928\u0947", 113, -1, "_HindiStemmer__r_CONSONANT"),
Among(u"\u0905\u0928\u0947", 126, -1),
Among(u"\u0906\u0928\u0947", 126, -1),
Among(u"\u093E\u0928\u0947", 126, -1),
Among(u"\u094B", -1, -1),
Among(u"\u094D", -1, -1)
]
g_consonant = [255, 255, 255, 255, 159, 0, 0, 0, 248, 7]
I_p = 0
def __r_CONSONANT(self):
# (, line 129
if not self.in_grouping_b(HindiStemmer.g_consonant, 2325, 2399):
return False
return True
def _stem(self):
# (, line 131
# test, line 132
v_1 = self.cursor
# (, line 132
# next, line 132
if self.cursor >= self.limit:
return False
self.cursor += 1
# setmark p, line 132
self.I_p = self.cursor
self.cursor = v_1
# backwards, line 133
self.limit_backward = self.cursor
self.cursor = self.limit
# (, line 133
# setlimit, line 139
if self.cursor < self.I_p:
return False
v_3 = self.limit_backward
self.limit_backward = self.I_p
# (, line 139
# [, line 139
self.ket = self.cursor
# substring, line 139
if self.find_among_b(HindiStemmer.a_0) == 0:
self.limit_backward = v_3
return False
# ], line 139
self.bra = self.cursor
self.limit_backward = v_3
# delete, line 321
if not self.slice_del():
return False
self.cursor = self.limit_backward
return True
class lab0(BaseException): pass