Feat: filter out more words
This commit is contained in:
4042
adjectives_10.txt
4042
adjectives_10.txt
File diff suppressed because it is too large
Load Diff
7
main.py
7
main.py
@ -32,7 +32,9 @@ numerical = {
|
|||||||
"dozen", "score", "gross", # Traditional counting units
|
"dozen", "score", "gross", # Traditional counting units
|
||||||
}
|
}
|
||||||
|
|
||||||
names = {"martin", "ben", "john", "maxwell", "ruth", "charlotte", "ada", "dick", "timothy", "earl", "geneva"}
|
innapropriate = {"nigger", "vagina", "rape", "penis"}
|
||||||
|
|
||||||
|
names = {"martin", "ben", "john", "maxwell", "ruth", "charlotte", "ada", "dick", "timothy", "earl", "geneva", "bobby"}
|
||||||
|
|
||||||
difficult = {
|
difficult = {
|
||||||
"aerator", "transducer", "substrate",
|
"aerator", "transducer", "substrate",
|
||||||
@ -86,7 +88,8 @@ def get_words():
|
|||||||
continue # winning, twisting; only want win, twist or feelings
|
continue # winning, twisting; only want win, twist or feelings
|
||||||
if word.endswith("s") and not word.endswith("ss"):
|
if word.endswith("s") and not word.endswith("ss"):
|
||||||
continue # leave duchess but skip provisions
|
continue # leave duchess but skip provisions
|
||||||
if word in numerical: # skip numbers
|
# exceptions
|
||||||
|
if word in numerical or word in names or word in difficult or word in innapropriate:
|
||||||
continue
|
continue
|
||||||
# If base form matches the word, it's singular/uncountable
|
# If base form matches the word, it's singular/uncountable
|
||||||
if base_form == word:
|
if base_form == word:
|
||||||
|
6702
nouns_10.txt
6702
nouns_10.txt
File diff suppressed because it is too large
Load Diff
Reference in New Issue
Block a user