File size: 1,298 Bytes
2b9435d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 |
import re
# Host fragments of known URL shorteners. Entries must be lower-case because
# they are compared against the lower-cased message.
_URL_SHORTENERS = (
    'bit.ly',
    'goo.gl',
    'me2.kr',
    'vo.la',
    'vvd.bz',
    '์คํํก.com',
    'openkakao.at',
    'openkakao.io',
    'openkakao.it',
)

# The scheme / "www." prefixes use NON-capturing groups on purpose: with a
# capturing group, findall() returns only the group text (e.g. 'https'), so a
# shortener host could never be found inside the result.
_URL_PATTERNS = (
    re.compile(r'\b(?:https?|ftp)://[^\s/$.?#].[^\s]*\b'),
    re.compile(r'\b(?:www\.)[^\s/$.?#].[^\s]*\b'),
)

# Substrings that mark a message as spam (matched against the lower-cased
# message; leading/trailing spaces inside a phrase are significant).
# NOTE(review): the non-ASCII literals in this module look like mis-decoded
# (mojibake) text, and four of the phrases contained a raw line break in the
# source, written here as "\n" -- confirm against the original file and
# restore the intended text.
_SPAM_PHRASES = (
    '๊ด๊ณ )',
    '์ ์ค',
    '์ํ๊ฐ',
    '์ต์ 150%',
    '๋ฌด๋ฃ๊ฑฐ๋ถ',
    '์ข\n๋ชฉ ์ถ์ฒ',
    '์ต๊ณ ๊ธ ์ ๋ณด',
    '์์ต๋ฅ ',
    '์์น ํ์ ',
    '์ต์ ',
    '๋์ ์ํฅ๋ ฅ',
    ' ๋ฐํ ์์ ',
    'ํ์ง๊ตญ',
    ' ํ์ธ ๋ฐ๋ผ',
    '์ฌ์ ์ฆ์',
    ' ์\n์ฅ ๊ฐ',
    '๋จ๋\n๋ฐํ',
    ' ์ด์ง ๊ฑด์ ',
    ' ๋ฐฉ์ ์ค๊ณ',
    ' ํํ',
    '์๋ฐฉํฅ ๊ฑฐ๋',
    '์ถ์ ์ข\n๋ชฉ',
    '์์น ๊ฐ',
    ' ํ์ด๋ฉ',
)


def is_spam(message: str) -> bool:
    """Return True if *message* looks like spam.

    A message is flagged when either of the following holds (both checks are
    case-insensitive):

    * it contains a URL (``http(s)://``, ``ftp://`` or ``www.`` prefixed)
      whose text includes one of the known URL-shortener hosts, or
    * it contains any of the known spam phrases as a substring.

    Args:
        message: The text to classify.

    Returns:
        True when a shortener URL or a spam phrase is found, otherwise False.
    """
    text = message.lower()

    # Check every URL found in the message for a shortener host.
    for pattern in _URL_PATTERNS:
        for url in pattern.findall(text):
            if any(shortener in url for shortener in _URL_SHORTENERS):
                return True

    # Fall back to plain substring matching of the spam phrases.
    return any(phrase in text for phrase in _SPAM_PHRASES)
|