usse/scrape/venv/lib/python3.10/site-packages/snowballstemmer/french_stemmer.py
2023-12-22 15:26:01 +01:00

968 lines
32 KiB
Python

# Generated by Snowball 2.2.0 - https://snowballstem.org/
from .basestemmer import BaseStemmer
from .among import Among
class FrenchStemmer(BaseStemmer):
'''
This class implements the stemming algorithm defined by a snowball script.
Generated by Snowball 2.2.0 - https://snowballstem.org/
'''
a_0 = [
Among(u"col", -1, -1),
Among(u"par", -1, -1),
Among(u"tap", -1, -1)
]
a_1 = [
Among(u"", -1, 7),
Among(u"H", 0, 6),
Among(u"He", 1, 4),
Among(u"Hi", 1, 5),
Among(u"I", 0, 1),
Among(u"U", 0, 2),
Among(u"Y", 0, 3)
]
a_2 = [
Among(u"iqU", -1, 3),
Among(u"abl", -1, 3),
Among(u"I\u00E8r", -1, 4),
Among(u"i\u00E8r", -1, 4),
Among(u"eus", -1, 2),
Among(u"iv", -1, 1)
]
a_3 = [
Among(u"ic", -1, 2),
Among(u"abil", -1, 1),
Among(u"iv", -1, 3)
]
a_4 = [
Among(u"iqUe", -1, 1),
Among(u"atrice", -1, 2),
Among(u"ance", -1, 1),
Among(u"ence", -1, 5),
Among(u"logie", -1, 3),
Among(u"able", -1, 1),
Among(u"isme", -1, 1),
Among(u"euse", -1, 11),
Among(u"iste", -1, 1),
Among(u"ive", -1, 8),
Among(u"if", -1, 8),
Among(u"usion", -1, 4),
Among(u"ation", -1, 2),
Among(u"ution", -1, 4),
Among(u"ateur", -1, 2),
Among(u"iqUes", -1, 1),
Among(u"atrices", -1, 2),
Among(u"ances", -1, 1),
Among(u"ences", -1, 5),
Among(u"logies", -1, 3),
Among(u"ables", -1, 1),
Among(u"ismes", -1, 1),
Among(u"euses", -1, 11),
Among(u"istes", -1, 1),
Among(u"ives", -1, 8),
Among(u"ifs", -1, 8),
Among(u"usions", -1, 4),
Among(u"ations", -1, 2),
Among(u"utions", -1, 4),
Among(u"ateurs", -1, 2),
Among(u"ments", -1, 15),
Among(u"ements", 30, 6),
Among(u"issements", 31, 12),
Among(u"it\u00E9s", -1, 7),
Among(u"ment", -1, 15),
Among(u"ement", 34, 6),
Among(u"issement", 35, 12),
Among(u"amment", 34, 13),
Among(u"emment", 34, 14),
Among(u"aux", -1, 10),
Among(u"eaux", 39, 9),
Among(u"eux", -1, 1),
Among(u"it\u00E9", -1, 7)
]
a_5 = [
Among(u"ira", -1, 1),
Among(u"ie", -1, 1),
Among(u"isse", -1, 1),
Among(u"issante", -1, 1),
Among(u"i", -1, 1),
Among(u"irai", 4, 1),
Among(u"ir", -1, 1),
Among(u"iras", -1, 1),
Among(u"ies", -1, 1),
Among(u"\u00EEmes", -1, 1),
Among(u"isses", -1, 1),
Among(u"issantes", -1, 1),
Among(u"\u00EEtes", -1, 1),
Among(u"is", -1, 1),
Among(u"irais", 13, 1),
Among(u"issais", 13, 1),
Among(u"irions", -1, 1),
Among(u"issions", -1, 1),
Among(u"irons", -1, 1),
Among(u"issons", -1, 1),
Among(u"issants", -1, 1),
Among(u"it", -1, 1),
Among(u"irait", 21, 1),
Among(u"issait", 21, 1),
Among(u"issant", -1, 1),
Among(u"iraIent", -1, 1),
Among(u"issaIent", -1, 1),
Among(u"irent", -1, 1),
Among(u"issent", -1, 1),
Among(u"iront", -1, 1),
Among(u"\u00EEt", -1, 1),
Among(u"iriez", -1, 1),
Among(u"issiez", -1, 1),
Among(u"irez", -1, 1),
Among(u"issez", -1, 1)
]
a_6 = [
Among(u"a", -1, 3),
Among(u"era", 0, 2),
Among(u"asse", -1, 3),
Among(u"ante", -1, 3),
Among(u"\u00E9e", -1, 2),
Among(u"ai", -1, 3),
Among(u"erai", 5, 2),
Among(u"er", -1, 2),
Among(u"as", -1, 3),
Among(u"eras", 8, 2),
Among(u"\u00E2mes", -1, 3),
Among(u"asses", -1, 3),
Among(u"antes", -1, 3),
Among(u"\u00E2tes", -1, 3),
Among(u"\u00E9es", -1, 2),
Among(u"ais", -1, 3),
Among(u"erais", 15, 2),
Among(u"ions", -1, 1),
Among(u"erions", 17, 2),
Among(u"assions", 17, 3),
Among(u"erons", -1, 2),
Among(u"ants", -1, 3),
Among(u"\u00E9s", -1, 2),
Among(u"ait", -1, 3),
Among(u"erait", 23, 2),
Among(u"ant", -1, 3),
Among(u"aIent", -1, 3),
Among(u"eraIent", 26, 2),
Among(u"\u00E8rent", -1, 2),
Among(u"assent", -1, 3),
Among(u"eront", -1, 2),
Among(u"\u00E2t", -1, 3),
Among(u"ez", -1, 2),
Among(u"iez", 32, 2),
Among(u"eriez", 33, 2),
Among(u"assiez", 33, 3),
Among(u"erez", 32, 2),
Among(u"\u00E9", -1, 2)
]
a_7 = [
Among(u"e", -1, 3),
Among(u"I\u00E8re", 0, 2),
Among(u"i\u00E8re", 0, 2),
Among(u"ion", -1, 1),
Among(u"Ier", -1, 2),
Among(u"ier", -1, 2)
]
a_8 = [
Among(u"ell", -1, -1),
Among(u"eill", -1, -1),
Among(u"enn", -1, -1),
Among(u"onn", -1, -1),
Among(u"ett", -1, -1)
]
g_v = [17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 128, 130, 103, 8, 5]
g_keep_with_s = [1, 65, 20, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 128]
I_p2 = 0
I_p1 = 0
I_pV = 0
def __r_prelude(self):
while True:
v_1 = self.cursor
try:
try:
while True:
v_2 = self.cursor
try:
try:
v_3 = self.cursor
try:
if not self.in_grouping(FrenchStemmer.g_v, 97, 251):
raise lab4()
self.bra = self.cursor
try:
v_4 = self.cursor
try:
if not self.eq_s(u"u"):
raise lab6()
self.ket = self.cursor
if not self.in_grouping(FrenchStemmer.g_v, 97, 251):
raise lab6()
if not self.slice_from(u"U"):
return False
raise lab5()
except lab6: pass
self.cursor = v_4
try:
if not self.eq_s(u"i"):
raise lab7()
self.ket = self.cursor
if not self.in_grouping(FrenchStemmer.g_v, 97, 251):
raise lab7()
if not self.slice_from(u"I"):
return False
raise lab5()
except lab7: pass
self.cursor = v_4
if not self.eq_s(u"y"):
raise lab4()
self.ket = self.cursor
if not self.slice_from(u"Y"):
return False
except lab5: pass
raise lab3()
except lab4: pass
self.cursor = v_3
try:
self.bra = self.cursor
if not self.eq_s(u"\u00EB"):
raise lab8()
self.ket = self.cursor
if not self.slice_from(u"He"):
return False
raise lab3()
except lab8: pass
self.cursor = v_3
try:
self.bra = self.cursor
if not self.eq_s(u"\u00EF"):
raise lab9()
self.ket = self.cursor
if not self.slice_from(u"Hi"):
return False
raise lab3()
except lab9: pass
self.cursor = v_3
try:
self.bra = self.cursor
if not self.eq_s(u"y"):
raise lab10()
self.ket = self.cursor
if not self.in_grouping(FrenchStemmer.g_v, 97, 251):
raise lab10()
if not self.slice_from(u"Y"):
return False
raise lab3()
except lab10: pass
self.cursor = v_3
if not self.eq_s(u"q"):
raise lab2()
self.bra = self.cursor
if not self.eq_s(u"u"):
raise lab2()
self.ket = self.cursor
if not self.slice_from(u"U"):
return False
except lab3: pass
self.cursor = v_2
raise lab1()
except lab2: pass
self.cursor = v_2
if self.cursor >= self.limit:
raise lab0()
self.cursor += 1
except lab1: pass
continue
except lab0: pass
self.cursor = v_1
break
return True
def __r_mark_regions(self):
self.I_pV = self.limit
self.I_p1 = self.limit
self.I_p2 = self.limit
v_1 = self.cursor
try:
try:
v_2 = self.cursor
try:
if not self.in_grouping(FrenchStemmer.g_v, 97, 251):
raise lab2()
if not self.in_grouping(FrenchStemmer.g_v, 97, 251):
raise lab2()
if self.cursor >= self.limit:
raise lab2()
self.cursor += 1
raise lab1()
except lab2: pass
self.cursor = v_2
try:
if self.find_among(FrenchStemmer.a_0) == 0:
raise lab3()
raise lab1()
except lab3: pass
self.cursor = v_2
if self.cursor >= self.limit:
raise lab0()
self.cursor += 1
if not self.go_out_grouping(FrenchStemmer.g_v, 97, 251):
raise lab0()
self.cursor += 1
except lab1: pass
self.I_pV = self.cursor
except lab0: pass
self.cursor = v_1
v_3 = self.cursor
try:
if not self.go_out_grouping(FrenchStemmer.g_v, 97, 251):
raise lab4()
self.cursor += 1
if not self.go_in_grouping(FrenchStemmer.g_v, 97, 251):
raise lab4()
self.cursor += 1
self.I_p1 = self.cursor
if not self.go_out_grouping(FrenchStemmer.g_v, 97, 251):
raise lab4()
self.cursor += 1
if not self.go_in_grouping(FrenchStemmer.g_v, 97, 251):
raise lab4()
self.cursor += 1
self.I_p2 = self.cursor
except lab4: pass
self.cursor = v_3
return True
def __r_postlude(self):
while True:
v_1 = self.cursor
try:
self.bra = self.cursor
among_var = self.find_among(FrenchStemmer.a_1)
if among_var == 0:
raise lab0()
self.ket = self.cursor
if among_var == 1:
if not self.slice_from(u"i"):
return False
elif among_var == 2:
if not self.slice_from(u"u"):
return False
elif among_var == 3:
if not self.slice_from(u"y"):
return False
elif among_var == 4:
if not self.slice_from(u"\u00EB"):
return False
elif among_var == 5:
if not self.slice_from(u"\u00EF"):
return False
elif among_var == 6:
if not self.slice_del():
return False
else:
if self.cursor >= self.limit:
raise lab0()
self.cursor += 1
continue
except lab0: pass
self.cursor = v_1
break
return True
def __r_RV(self):
if not self.I_pV <= self.cursor:
return False
return True
def __r_R1(self):
if not self.I_p1 <= self.cursor:
return False
return True
def __r_R2(self):
if not self.I_p2 <= self.cursor:
return False
return True
def __r_standard_suffix(self):
self.ket = self.cursor
among_var = self.find_among_b(FrenchStemmer.a_4)
if among_var == 0:
return False
self.bra = self.cursor
if among_var == 1:
if not self.__r_R2():
return False
if not self.slice_del():
return False
elif among_var == 2:
if not self.__r_R2():
return False
if not self.slice_del():
return False
v_1 = self.limit - self.cursor
try:
self.ket = self.cursor
if not self.eq_s_b(u"ic"):
self.cursor = self.limit - v_1
raise lab0()
self.bra = self.cursor
try:
v_2 = self.limit - self.cursor
try:
if not self.__r_R2():
raise lab2()
if not self.slice_del():
return False
raise lab1()
except lab2: pass
self.cursor = self.limit - v_2
if not self.slice_from(u"iqU"):
return False
except lab1: pass
except lab0: pass
elif among_var == 3:
if not self.__r_R2():
return False
if not self.slice_from(u"log"):
return False
elif among_var == 4:
if not self.__r_R2():
return False
if not self.slice_from(u"u"):
return False
elif among_var == 5:
if not self.__r_R2():
return False
if not self.slice_from(u"ent"):
return False
elif among_var == 6:
if not self.__r_RV():
return False
if not self.slice_del():
return False
v_3 = self.limit - self.cursor
try:
self.ket = self.cursor
among_var = self.find_among_b(FrenchStemmer.a_2)
if among_var == 0:
self.cursor = self.limit - v_3
raise lab3()
self.bra = self.cursor
if among_var == 1:
if not self.__r_R2():
self.cursor = self.limit - v_3
raise lab3()
if not self.slice_del():
return False
self.ket = self.cursor
if not self.eq_s_b(u"at"):
self.cursor = self.limit - v_3
raise lab3()
self.bra = self.cursor
if not self.__r_R2():
self.cursor = self.limit - v_3
raise lab3()
if not self.slice_del():
return False
elif among_var == 2:
try:
v_4 = self.limit - self.cursor
try:
if not self.__r_R2():
raise lab5()
if not self.slice_del():
return False
raise lab4()
except lab5: pass
self.cursor = self.limit - v_4
if not self.__r_R1():
self.cursor = self.limit - v_3
raise lab3()
if not self.slice_from(u"eux"):
return False
except lab4: pass
elif among_var == 3:
if not self.__r_R2():
self.cursor = self.limit - v_3
raise lab3()
if not self.slice_del():
return False
else:
if not self.__r_RV():
self.cursor = self.limit - v_3
raise lab3()
if not self.slice_from(u"i"):
return False
except lab3: pass
elif among_var == 7:
if not self.__r_R2():
return False
if not self.slice_del():
return False
v_5 = self.limit - self.cursor
try:
self.ket = self.cursor
among_var = self.find_among_b(FrenchStemmer.a_3)
if among_var == 0:
self.cursor = self.limit - v_5
raise lab6()
self.bra = self.cursor
if among_var == 1:
try:
v_6 = self.limit - self.cursor
try:
if not self.__r_R2():
raise lab8()
if not self.slice_del():
return False
raise lab7()
except lab8: pass
self.cursor = self.limit - v_6
if not self.slice_from(u"abl"):
return False
except lab7: pass
elif among_var == 2:
try:
v_7 = self.limit - self.cursor
try:
if not self.__r_R2():
raise lab10()
if not self.slice_del():
return False
raise lab9()
except lab10: pass
self.cursor = self.limit - v_7
if not self.slice_from(u"iqU"):
return False
except lab9: pass
else:
if not self.__r_R2():
self.cursor = self.limit - v_5
raise lab6()
if not self.slice_del():
return False
except lab6: pass
elif among_var == 8:
if not self.__r_R2():
return False
if not self.slice_del():
return False
v_8 = self.limit - self.cursor
try:
self.ket = self.cursor
if not self.eq_s_b(u"at"):
self.cursor = self.limit - v_8
raise lab11()
self.bra = self.cursor
if not self.__r_R2():
self.cursor = self.limit - v_8
raise lab11()
if not self.slice_del():
return False
self.ket = self.cursor
if not self.eq_s_b(u"ic"):
self.cursor = self.limit - v_8
raise lab11()
self.bra = self.cursor
try:
v_9 = self.limit - self.cursor
try:
if not self.__r_R2():
raise lab13()
if not self.slice_del():
return False
raise lab12()
except lab13: pass
self.cursor = self.limit - v_9
if not self.slice_from(u"iqU"):
return False
except lab12: pass
except lab11: pass
elif among_var == 9:
if not self.slice_from(u"eau"):
return False
elif among_var == 10:
if not self.__r_R1():
return False
if not self.slice_from(u"al"):
return False
elif among_var == 11:
try:
v_10 = self.limit - self.cursor
try:
if not self.__r_R2():
raise lab15()
if not self.slice_del():
return False
raise lab14()
except lab15: pass
self.cursor = self.limit - v_10
if not self.__r_R1():
return False
if not self.slice_from(u"eux"):
return False
except lab14: pass
elif among_var == 12:
if not self.__r_R1():
return False
if not self.out_grouping_b(FrenchStemmer.g_v, 97, 251):
return False
if not self.slice_del():
return False
elif among_var == 13:
if not self.__r_RV():
return False
if not self.slice_from(u"ant"):
return False
return False
elif among_var == 14:
if not self.__r_RV():
return False
if not self.slice_from(u"ent"):
return False
return False
else:
v_11 = self.limit - self.cursor
if not self.in_grouping_b(FrenchStemmer.g_v, 97, 251):
return False
if not self.__r_RV():
return False
self.cursor = self.limit - v_11
if not self.slice_del():
return False
return False
return True
def __r_i_verb_suffix(self):
if self.cursor < self.I_pV:
return False
v_2 = self.limit_backward
self.limit_backward = self.I_pV
self.ket = self.cursor
if self.find_among_b(FrenchStemmer.a_5) == 0:
self.limit_backward = v_2
return False
self.bra = self.cursor
v_3 = self.limit - self.cursor
try:
if not self.eq_s_b(u"H"):
raise lab0()
self.limit_backward = v_2
return False
except lab0: pass
self.cursor = self.limit - v_3
if not self.out_grouping_b(FrenchStemmer.g_v, 97, 251):
self.limit_backward = v_2
return False
if not self.slice_del():
return False
self.limit_backward = v_2
return True
def __r_verb_suffix(self):
if self.cursor < self.I_pV:
return False
v_2 = self.limit_backward
self.limit_backward = self.I_pV
self.ket = self.cursor
among_var = self.find_among_b(FrenchStemmer.a_6)
if among_var == 0:
self.limit_backward = v_2
return False
self.bra = self.cursor
if among_var == 1:
if not self.__r_R2():
self.limit_backward = v_2
return False
if not self.slice_del():
return False
elif among_var == 2:
if not self.slice_del():
return False
else:
if not self.slice_del():
return False
v_3 = self.limit - self.cursor
try:
self.ket = self.cursor
if not self.eq_s_b(u"e"):
self.cursor = self.limit - v_3
raise lab0()
self.bra = self.cursor
if not self.slice_del():
return False
except lab0: pass
self.limit_backward = v_2
return True
def __r_residual_suffix(self):
v_1 = self.limit - self.cursor
try:
self.ket = self.cursor
if not self.eq_s_b(u"s"):
self.cursor = self.limit - v_1
raise lab0()
self.bra = self.cursor
v_2 = self.limit - self.cursor
try:
v_3 = self.limit - self.cursor
try:
if not self.eq_s_b(u"Hi"):
raise lab2()
raise lab1()
except lab2: pass
self.cursor = self.limit - v_3
if not self.out_grouping_b(FrenchStemmer.g_keep_with_s, 97, 232):
self.cursor = self.limit - v_1
raise lab0()
except lab1: pass
self.cursor = self.limit - v_2
if not self.slice_del():
return False
except lab0: pass
if self.cursor < self.I_pV:
return False
v_5 = self.limit_backward
self.limit_backward = self.I_pV
self.ket = self.cursor
among_var = self.find_among_b(FrenchStemmer.a_7)
if among_var == 0:
self.limit_backward = v_5
return False
self.bra = self.cursor
if among_var == 1:
if not self.__r_R2():
self.limit_backward = v_5
return False
try:
v_6 = self.limit - self.cursor
try:
if not self.eq_s_b(u"s"):
raise lab4()
raise lab3()
except lab4: pass
self.cursor = self.limit - v_6
if not self.eq_s_b(u"t"):
self.limit_backward = v_5
return False
except lab3: pass
if not self.slice_del():
return False
elif among_var == 2:
if not self.slice_from(u"i"):
return False
else:
if not self.slice_del():
return False
self.limit_backward = v_5
return True
def __r_un_double(self):
v_1 = self.limit - self.cursor
if self.find_among_b(FrenchStemmer.a_8) == 0:
return False
self.cursor = self.limit - v_1
self.ket = self.cursor
if self.cursor <= self.limit_backward:
return False
self.cursor -= 1
self.bra = self.cursor
if not self.slice_del():
return False
return True
def __r_un_accent(self):
v_1 = 1
while True:
try:
if not self.out_grouping_b(FrenchStemmer.g_v, 97, 251):
raise lab0()
v_1 -= 1
continue
except lab0: pass
break
if v_1 > 0:
return False
self.ket = self.cursor
try:
v_3 = self.limit - self.cursor
try:
if not self.eq_s_b(u"\u00E9"):
raise lab2()
raise lab1()
except lab2: pass
self.cursor = self.limit - v_3
if not self.eq_s_b(u"\u00E8"):
return False
except lab1: pass
self.bra = self.cursor
if not self.slice_from(u"e"):
return False
return True
def _stem(self):
v_1 = self.cursor
self.__r_prelude()
self.cursor = v_1
self.__r_mark_regions()
self.limit_backward = self.cursor
self.cursor = self.limit
v_3 = self.limit - self.cursor
try:
try:
v_4 = self.limit - self.cursor
try:
v_5 = self.limit - self.cursor
try:
v_6 = self.limit - self.cursor
try:
if not self.__r_standard_suffix():
raise lab4()
raise lab3()
except lab4: pass
self.cursor = self.limit - v_6
try:
if not self.__r_i_verb_suffix():
raise lab5()
raise lab3()
except lab5: pass
self.cursor = self.limit - v_6
if not self.__r_verb_suffix():
raise lab2()
except lab3: pass
self.cursor = self.limit - v_5
v_7 = self.limit - self.cursor
try:
self.ket = self.cursor
try:
v_8 = self.limit - self.cursor
try:
if not self.eq_s_b(u"Y"):
raise lab8()
self.bra = self.cursor
if not self.slice_from(u"i"):
return False
raise lab7()
except lab8: pass
self.cursor = self.limit - v_8
if not self.eq_s_b(u"\u00E7"):
self.cursor = self.limit - v_7
raise lab6()
self.bra = self.cursor
if not self.slice_from(u"c"):
return False
except lab7: pass
except lab6: pass
raise lab1()
except lab2: pass
self.cursor = self.limit - v_4
if not self.__r_residual_suffix():
raise lab0()
except lab1: pass
except lab0: pass
self.cursor = self.limit - v_3
v_9 = self.limit - self.cursor
self.__r_un_double()
self.cursor = self.limit - v_9
v_10 = self.limit - self.cursor
self.__r_un_accent()
self.cursor = self.limit - v_10
self.cursor = self.limit_backward
v_11 = self.cursor
self.__r_postlude()
self.cursor = v_11
return True
class lab0(BaseException): pass
class lab1(BaseException): pass
class lab2(BaseException): pass
class lab3(BaseException): pass
class lab4(BaseException): pass
class lab5(BaseException): pass
class lab6(BaseException): pass
class lab7(BaseException): pass
class lab8(BaseException): pass
class lab9(BaseException): pass
class lab10(BaseException): pass
class lab11(BaseException): pass
class lab12(BaseException): pass
class lab13(BaseException): pass
class lab14(BaseException): pass
class lab15(BaseException): pass