Add .env file and fix requests

DiegoCaraballo · DiegoCaraballo · commit e378f08380f7 · 2021-02-24T14:51:51.000-03:00
diff --git a/Python/Twitter_Scrapper/README.md b/Python/Twitter_Scrapper/README.md
@@ -2,8 +2,6 @@
 
 This script extracts all Tweets, Retweets, Images, Videos, Hashtags, Likes and Pinned tweet of a specific user in a .csv file.
 
-![How to use the script](https://i.ibb.co/mcjK65f/Tweeter-Scrapper.png)
-
 ### Requirements
 
 1. The system should have  **python**  and  **tweepy**  installed. Also, the user should have a  **Twitter developer account**  and a  **Twitter app**  (if you do not have one, create one at  [here](https://developer.twitter.com/)). The use of Tweepy and need for a developer account is in accordance with the Twitter scraping rules.
@@ -12,15 +10,16 @@ This script extracts all Tweets, Retweets, Images, Videos, Hashtags, Likes and P
 ### Setup
 
 1.  Create a Virtual Environment.
-2.  Install the requirements by using  `pip install -r requirements.txt`
-3. Open the script in any text editor/IDE
-4. Get the credentials from the app created by you on twitter developer account and enter them here.
-5. Also add the path to your chrome driver in the PATH_CHROME_DRIVER constant
-6.  Hurray.! You're ready to use the script to extracts all Tweets, Retweets, Images, Videos, Hashtags and Likes of a specific user.
+2.  Install the requirements by using  `pip3 install -r requirements.txt`
+3. Create a `.env` file modeled on `.env.example` and add the credentials from the app you created in your Twitter developer account.
+4. Also add the path to your Chrome driver in the `.env` file.
+5.  Hurray! You're ready to use the script to extract all Tweets, Retweets, Images, Videos, Hashtags and Likes of a specific user.
 
 ### Running a File
 
 1.  Run the Script  `python twitter_scrapper.py`
-3.  Enter the username you want the information from.
-4. Finally, you need to enter a Twitter username and password in order to extract the pinned Tweet (if it exists)
-5. The .csv file is downloaded to the folder where the file runs.
+2.  Enter the username you want the information from.
+3. Finally, you need to enter a Twitter username and password in order to extract the pinned Tweet (if it exists)
+4. The `.csv` file is downloaded to the folder where the file runs.
+
+![How to use the script](https://i.ibb.co/mcjK65f/Tweeter-Scrapper.png)
diff --git a/Python/Twitter_Scrapper/requirements.txt b/Python/Twitter_Scrapper/requirements.txt
@@ -3,12 +3,14 @@ bs4==0.0.1
 certifi==2020.12.5
 chardet==4.0.0
 idna==2.10
+lxml==4.6.2
 oauthlib==3.1.0
 PySocks==1.7.1
+python-decouple==3.4
 requests==2.25.1
 requests-oauthlib==1.3.0
 selenium==3.141.0
 six==1.15.0
 soupsieve==2.2
 tweepy==3.10.0
-urllib3==1.26.3
+urllib3==1.26.3
diff --git a/Python/Twitter_Scrapper/twitter_scrapper.py b/Python/Twitter_Scrapper/twitter_scrapper.py
@@ -10,19 +10,22 @@
 
 import tweepy
 from bs4 import BeautifulSoup
+from decouple import config
 from selenium import webdriver
 
 # Authenticate to Twitter
-CONSUMER_KEY = "<your-consumer-or-API-key-goes-here>"
-CONSUMER_SECRET = "<your-consumer-or-API-secret-goes-here>"
-ACCESS_KEY = "<your-access-key-goes-here>"
-ACESS_SECRET = "<your-access-secret-goes-here>"
+CONSUMER_KEY = config("CONSUMER_KEY")
+CONSUMER_SECRET = config("CONSUMER_SECRET")
+ACCESS_KEY = config("ACCESS_KEY")
+ACESS_SECRET = config("ACESS_SECRET")
+
+# Authenticate to Twitter
 auth = tweepy.OAuthHandler(CONSUMER_KEY, CONSUMER_SECRET)
 auth.set_access_token(ACCESS_KEY, ACESS_SECRET)
 api = tweepy.API(auth)
 
 URL = "https://twitter.com"
-PATH_CHROME_DRIVER = "<===============ENTER YOUR CHROME DRIVER PATH===========>"
+PATH_CHROME_DRIVER = config("PATH_CHROME_DRIVER")
 random_time_2_to_5 = random.randint(2, 5)
 random_time_5_to_10 = random.randint(5, 10)
 
@@ -99,11 +102,18 @@ def extract_tweets(user_to_scrape):
     try:
         print("Extracting Tweets, Retweets, Media and Hashtags, please wait...!")
 
-        tweets = api.user_timeline(
-            screen_name=user_to_scrape,
-            # 200 is the maximum allowed count
-            count=200,
-        )
+        tweets = None
+
+        try:
+            tweets = api.user_timeline(
+                screen_name=user_to_scrape,
+                # 200 is the maximum allowed count
+                count=200,
+            )
+        except tweepy.TweepError as error:
+            print(error.args[0][0]["message"])
+            time.sleep(2)
+            main()
 
         all_tweets = []
         url_tweets = []