Merge pull request #102 from aayaffe/v2.0

Added support for automatic chromedriver management. Removed chrome d…
2024-11-10 06:04:17 +00:00 · 2020-04-11 18:26:45 +05:00 · 2020-04-11 18:26:45 +05:00 · d9dc89ef3a
commit d9dc89ef3a
parent 4ed08fe3d2 3cb987c25b
6 changed files with 6 additions and 17 deletions
--- a/.gitignore
+++ b/.gitignore
@ -1,4 +1,3 @@
-
 # Created by https://www.gitignore.io/api/python
 # Edit at https://www.gitignore.io/?templates=python

@ -115,6 +114,9 @@ dmypy.json

 ## Generated data
 /data
+scraper/credentials.yaml
+scraper/input.txt
+scraper/data/

 ## Python venv
 venv
--- a/bin/chromedriver_linux64
+++ b/bin/chromedriver_linux64
--- a/bin/chromedriver_mac64
+++ b/bin/chromedriver_mac64
--- a/bin/chromedriver_win32.exe
+++ b/bin/chromedriver_win32.exe
--- a/scraper/scraper.py
+++ b/scraper/scraper.py
@ -14,6 +14,7 @@ from selenium.webdriver.chrome.options import Options
 from selenium.webdriver.common.by import By
 from selenium.webdriver.support import expected_conditions as EC
 from selenium.webdriver.support.ui import WebDriverWait
+from webdriver_manager.chrome import ChromeDriverManager


 def get_facebook_images_url(img_links):
@ -404,7 +405,6 @@ def save_to_file(name, elements, status, current_section):


 def scrape_data(user_id, scan_list, section, elements_path, save_status, file_names):
-
    """Given some parameters, this function can scrap friends/photos/videos/about/posts(statuses) of a profile"""
    page = []

@ -555,20 +555,8 @@ def login(email, password):

        try:
            platform_ = platform.system().lower()
-            chromedriver_versions = {
-                "linux": os.path.join(
-                    os.getcwd(), CHROMEDRIVER_BINARIES_FOLDER, "chromedriver_linux64",
-                ),
-                "darwin": os.path.join(
-                    os.getcwd(), CHROMEDRIVER_BINARIES_FOLDER, "chromedriver_mac64",
-                ),
-                "windows": os.path.join(
-                    os.getcwd(), CHROMEDRIVER_BINARIES_FOLDER, "chromedriver_win32.exe",
-                ),
-            }
-
            driver = webdriver.Chrome(
-                executable_path=chromedriver_versions[platform_], options=options
+                executable_path=ChromeDriverManager().install(), options=options
            )
        except Exception:
            print(
@ -649,7 +637,6 @@ def scraper(**kwargs):
 # -------------------------------------------------------------

 if __name__ == "__main__":
-
    ap = argparse.ArgumentParser()
    # PLS CHECK IF HELP CAN BE BETTER / LESS AMBIGUOUS
    ap.add_argument(
--- a/setup.py
+++ b/setup.py
@ -27,7 +27,7 @@ setuptools.setup(
    ],
    python_requires=">=3.7",
    extras_require={"dev": ["black", "twine", "wheel"],},
-    install_requires=["selenium==3.141.0", "pyyaml"],
+    install_requires=["selenium==3.141.0", "pyyaml", "webdriver_manager"],
    entry_points={
        "console_scripts": ["ultimate-facebook-scraper=scraper.__main__:scraper",],
    },