From 192e2c333e0116e7f9a1ffafb991f06ca2b26cf0 Mon Sep 17 00:00:00 2001 From: rsb-23 <57601627+rsb-23@users.noreply.github.com> Date: Tue, 3 Sep 2024 21:04:10 +0530 Subject: [PATCH] Fixed false positives #2273 - Updated user-agent in header and removed duplicate - --- sherlock_project/resources/data.json | 45 +++++++++++----------------- sherlock_project/sherlock.py | 2 +- 2 files changed, 19 insertions(+), 28 deletions(-) diff --git a/sherlock_project/resources/data.json b/sherlock_project/resources/data.json index 8f38fd0..12914b1 100644 --- a/sherlock_project/resources/data.json +++ b/sherlock_project/resources/data.json @@ -682,9 +682,7 @@ "Duolingo": { "errorMsg": "{\"users\":[]}", "errorType": "message", - "headers": { - "User-Agent": "Mozilla/5.0 (X11; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/116.0" - }, + "url": "https://www.duolingo.com/profile/{}", "urlMain": "https://duolingo.com/", "urlProbe": "https://www.duolingo.com/2017-06-30/users?username={}", @@ -754,8 +752,7 @@ "username_claimed": "finanzfrage" }, "Fiverr": { - "errorMsg": "\"status\":\"success\"", - "errorType": "message", + "errorType": "status_code", "regexCheck": "^[A-Za-z][A-Za-z\\d_]{5,14}$", "request_method": "POST", "request_payload": { @@ -996,7 +993,7 @@ "username_claimed": "adam" }, "HackenProof (Hackers)": { - "errorMsg": "
Error: This user doesn't exist
", "errorType": "message", + "headers": { + "Cookie": "LTAnonSessionID=3159599315; LTUnifiedCookie=%7B%22areyouhuman%22%3A1%7D; " + }, "url": "https://www.librarything.com/profile/{}", "urlMain": "https://www.librarything.com/", "username_claimed": "blue" }, "Lichess": { - "errorMsg": "Page not found!", - "errorType": "message", + "errorType": "status_code", "url": "https://lichess.org/@/{}", "urlMain": "https://lichess.org", "username_claimed": "blue" }, "LinkedIn": { "errorType": "status_code", - "headers": { - "User-Agent": "Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Chrome/W.X.Y.Z Safari/537.36" - }, + "regexCheck": "^[a-zA-Z0-9]{3,100}$", "request_method": "GET", "url": "https://linkedin.com/in/{}", @@ -1964,9 +1958,7 @@ }, "Spotify": { "errorType": "status_code", - "headers": { - "user-agent": "PostmanRuntime/7.29.2" - }, + "url": "https://open.spotify.com/user/{}", "urlMain": "https://open.spotify.com/", "username_claimed": "blue" @@ -2205,7 +2197,8 @@ "username_claimed": "jenny" }, "Vero": { - "errorType": "status_code", + "errorMsg": "Not Found", + "errorType": "message", "request_method": "GET", "url": "https://vero.co/{}", "urlMain": "https://vero.co/", @@ -2375,9 +2368,7 @@ }, "YouTube": { "errorType": "status_code", - "headers": { - "User-Agent": "Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Chrome/W.X.Y.Z Safari/537.36" - }, + "url": "https://www.youtube.com/@{}", "urlMain": "https://www.youtube.com/", "username_claimed": "youtube" @@ -2803,4 +2794,4 @@ "urlMain": "https://znanylekarz.pl", "username_claimed": "janusz-nowak" } -} +} \ No newline at end of file diff --git a/sherlock_project/sherlock.py b/sherlock_project/sherlock.py index e36ca6c..c87dfd5 100644 --- a/sherlock_project/sherlock.py +++ b/sherlock_project/sherlock.py @@ -261,7 +261,7 @@ def sherlock( # A user agent is needed because some sites don't return the correct # information since they think that we are bots (Which we actually are...) headers = { - "User-Agent": "Mozilla/5.0 (X11; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/116.0", + "User-Agent": "Mozilla/5.0 (X11; Linux x86_64; rv:129.0) Gecko/20100101 Firefox/129.0", } if "headers" in net_info: