From a7d0e5aff2b46df08f52ed9fff95536ccfc9f087 Mon Sep 17 00:00:00 2001 From: hkc Date: Tue, 5 Mar 2024 15:46:49 +0300 Subject: [PATCH] Filter words tweaking --- nfuck/link_verifier.py | 13 ++++++++----- 1 file changed, 8 insertions(+), 5 deletions(-) diff --git a/nfuck/link_verifier.py b/nfuck/link_verifier.py index 07e35b6..f9ea4e3 100644 --- a/nfuck/link_verifier.py +++ b/nfuck/link_verifier.py @@ -19,14 +19,17 @@ USER_AGENT = [ REGEX_PATTERNS: list[tuple[float, Pattern, str]] = [ (1.0, regexp(r"\bp2e\b", IGNORECASE), "Play-to-earn keyword"), (5.0, regexp(r"play\-to\-earn", IGNORECASE), "Play-to-earn directly"), - (3.0, regexp(r"encryption\.js", IGNORECASE), "Metamask"), - (2.0, regexp(r"\bweb3\b", IGNORECASE), "Web3 mention"), + (3.0, regexp(r"encryption\.js", IGNORECASE), "encryption.js"), + (3.0, regexp(r"web3-ethers\.js", IGNORECASE), "web3-ethers.js"), + (1.0, regexp(r"\bweb3\b", IGNORECASE), "Web3 mention"), (1.0, regexp(r"\bnft\b", IGNORECASE), "NFT mention"), - (0.7, regexp(r"\belon\b", IGNORECASE), "Cryptobro Elon"), - (0.5, regexp(r"\bbiden\b", IGNORECASE), "Sleepy Joe"), - (1.0, regexp(r"\bcrypto\b", IGNORECASE), "Crypto mention"), (3.0, regexp(r"What The Fluff | CLAIM ALL !", IGNORECASE), "WTF Claim all"), (3.0, regexp(r"Suckerberg's Nutsack", IGNORECASE), "Suckerberg balls"), + (4.0, regexp(r"\w+: Claim your first \w+ and lets P2E", IGNORECASE), "Claim your first bs"), + (5.0, regexp(r"https://twitter\.com/what_thefluff"), "Link to what the fluff twitter"), + (3.0, regexp(r"Discover what \ \w+ will become your", IGNORECASE), "Some random button from common scam website"), + (3.0, regexp(r"fluff (token|coin)", IGNORECASE), "fluff token/coin"), + (3.0, regexp(r"A collection of \w+ NFTs", IGNORECASE), "Collection of [some] NFTs"), ] MAX_SCORE = sum(t[0] for t in REGEX_PATTERNS)