diff --git a/antiabuse/normalize/__init__.py b/antiabuse/normalize/__init__.py index bebe40f..851935b 100644 --- a/antiabuse/normalize/__init__.py +++ b/antiabuse/normalize/__init__.py @@ -16,6 +16,7 @@ "c+[uv]+m+s+": "cums", "cvmming": "cumming", "cvmshot": "cumshot", + "dyck": "dick", "ejakulate": "ejaculate", "fcked": "fucked", "fck": "fuck", @@ -36,6 +37,7 @@ "ngger": "nigger", "nggr": "nigger", "n[ie]g{1,2}re{1,2}s+": "negress", + "niga": "nigga", "nigge": "nigger", "nigg": "nigger", "p0rn": "porn", @@ -116,9 +118,7 @@ def _remove_zero_width_characters(s: str): def normalize_string(s: str): - # Normalize the string to NFD (Normalization Form Decomposition) and Filter - # out combining diacritical marks (e.g., accents) - normalized_input = unicodedata.normalize('NFKC', s) + normalized_input = unicodedata.normalize('NFKD', s) normalized_input = ''.join( char for char in normalized_input if not unicodedata.combining(char) ) diff --git a/antiabuse/normalize/test_init.py b/antiabuse/normalize/test_init.py index 560ba45..969b55b 100644 --- a/antiabuse/normalize/test_init.py +++ b/antiabuse/normalize/test_init.py @@ -28,6 +28,12 @@ def test_normalize_string(self): self.assertEqual(normalize_string("niggreess"), "negress") + self.assertEqual(normalize_string("slūt"), "slut") + + self.assertEqual(normalize_string("dyck"), "dick") + + self.assertEqual(normalize_string("niga"), "nigga") + if __name__ == '__main__': unittest.main() diff --git a/banned-club.sql b/banned-club.sql index 0f34e93..ec0b0b7 100644 --- a/banned-club.sql +++ b/banned-club.sql @@ -397,6 +397,7 @@ VALUES ('big dick'), ('big dick club'), ('big dick deviant'), + ('big pervert'), ('big thick cock'), ('big tits'), ('big white cock'), @@ -452,6 +453,7 @@ VALUES ('bug people hater'), ('bugs hater'), ('bukkake'), + ('bulimia'), ('bully bait'), ('bullybait'), ('bum sex'), @@ -616,6 +618,7 @@ VALUES ('cutmaxxer'), ('cutmaxxing'), ('cut me'), + ('cuts'), ('cutslut'), ('cutsluts'), ('cutter'), @@ -632,6 +635,8 @@ VALUES ('deep ass thinker'), ('deepfake'), ('definitely retarded'), + ('degradee'), + ('degrader'), ('deport asians'), ('deport black people'), ('deport blacks'), @@ -705,6 +710,7 @@ VALUES ('dogfuckr'), ('domestic abuse'), ('domestic terrorist'), + ('domestic violence'), ('donkey punch'), ('don''t be trans'), ('dothead'), @@ -939,6 +945,7 @@ VALUES ('fuck irish people'), ('fuck islam'), ('fuck israel'), + ('fuckisrael'), ('fuck jewish people'), ('fuck jews'), ('fuck judaism'), @@ -965,6 +972,7 @@ VALUES ('fuck my pathetic nigger life'), ('fuck my retard life'), ('fuck nazis'), + ('fucknebby'), ('fuck niggers'), ('fuck nigs'), ('fuck norway'), @@ -1083,6 +1091,7 @@ VALUES ('gook'), ('gooks'), ('goon'), + ('goon3r'), ('goonasmaximus'), ('goon blue lock'), ('goon cave gang'), @@ -1094,10 +1103,13 @@ VALUES ('gooner but also ace'), ('goonercell'), ('gooner club'), + ('goonergoth'), + ('goonerific'), ('goonerlicious'), ('gooner lover'), ('gooners'), ('gooners dni'), + ('goonett3'), ('goonette'), ('goongang'), ('gooning'), @@ -1110,6 +1122,7 @@ VALUES ('goon-ion'), ('goon larper'), ('goonmaxxing'), + ('goonpill'), ('goonpilled'), ('goonqueen'), ('goonsexual'), @@ -1127,6 +1140,7 @@ VALUES ('goysloppers'), ('goyslop rejecters'), ('grape'), + ('grapeist'), ('grape me'), ('grapist'), ('grass fucker'), @@ -1259,6 +1273,7 @@ VALUES ('hitler''s top guy'), ('hitlers top guy'), ('hitlerstrongest jannissary'), + ('hitlerstruewarriors'), ('hitler youth'), ('homeless nigga'), ('homicidal'), @@ -1287,6 +1302,7 @@ VALUES ('huge tits'), ('hurt me'), ('husband beater'), + ('hyperborea'), ('hypersexual'), ('i abuse men'), ('i abuse women'), @@ -1786,11 +1802,14 @@ VALUES ('i wipe my ass and i slap my nuts'), ('jacking off'), ('jailbait'), + ('jelking'), + ('jelq'), ('jelq king'), ('jelqmaxxer'), ('jerking off as you''re reading this'), ('jerking off counts as a hobby'), ('jerking off rn'), + ('jerkmaxxer'), ('jerusalem hate'), ('jew beater'), ('jew gasser'), @@ -2157,6 +2176,7 @@ VALUES ('muslim hater'), ('muslims hater'), ('my face is a chair'), + ('n'), ('nate higgers'), ('national socialism'), ('national socialist'), @@ -2207,6 +2227,7 @@ VALUES ('nigga love'), ('niggamaxxing'), ('nigga penis'), + ('niggar'), ('niggarapist'), ('niggas'), ('niggastyle'), @@ -2253,6 +2274,7 @@ VALUES ('not a paedophile'), ('not a pedophile'), ('not even a femcel bc i fuck irl'), + ('noticer'), ('not over 18'), ('not retarded'), ('not sexual'), @@ -2298,6 +2320,7 @@ VALUES ('paraphilias'), ('part time gooner'), ('passionate sex'), + ('patern noticer'), ('patricide'), ('pattern noticer'), ('pausedmygoonseshtobehere'), @@ -2542,6 +2565,7 @@ VALUES ('rope maxxing'), ('ropemaxxing'), ('rough sex'), + ('rule 34'), ('russiaphobe'), ('russiaphobic'), ('russophobe'), @@ -2901,6 +2925,7 @@ VALUES ('veiny dick'), ('verbal abuse'), ('victim'), + ('violence enjoyer'), ('violencepilled'), ('violent'), ('virgin suicide'), diff --git a/service/chat/rude/__init__.py b/service/chat/rude/__init__.py index 9ca2d2e..cbede2e 100644 --- a/service/chat/rude/__init__.py +++ b/service/chat/rude/__init__.py @@ -38,13 +38,20 @@ "bellend", "benis", "bestiality", + "bewbies", "bitch", "blow job", "blow jobs", "blowjob", "blowjobs", "boobies", + "boobs", + "breading me", + "breading you", "breasts", + "breed me", + "breed you", + "breedable", "bukkake", "butt fuck", "butt fucked", @@ -100,6 +107,7 @@ "cuntlicker", "cuntlicking", "cunts", + "cut herself", "cut me", "cut my wrist", "cut my wrists", @@ -146,6 +154,7 @@ "faggitt", "faggot", "faggots", + "fags", "fannyflaps", "fannyfucker", "fanyy", @@ -197,9 +206,13 @@ "golden shower", "gook", "gooks", + "gooner", "gooners", "goonette", "goonettes", + "gooning", + "goonmaxxing", + "goyish", "hand job", "hand-job", "handjob", @@ -211,6 +224,7 @@ "hanging yourself", "heil", "hit it raw", + "ho", "hoe", "hoes", "homo", @@ -380,18 +394,23 @@ "spit on you", "spit on your face", "spit on your mouth", + "stab me", + "stab you", "stabbing me", "stabbing you", "strangle me", "strangle you", + "stroking it", "suicidal", "suicide", "testicle", + "thot", "throat fuck", "throat fucking", "throat pussy", "throatfuck", "throatfucking", + "tiddies", "tie me", "tie you", "tit fuck", @@ -418,6 +437,8 @@ "tittywank", "titwank", "tnd", + "to goon", + "tranner", "trannies", "tranny", "troon",