From 0e6b8d0dcae0fbccee84a1fa6b48bf2a0ea0f52a Mon Sep 17 00:00:00 2001
From: George Tsomlektsis <ultrawelfaredev@gmail.com>
Date: Thu, 24 Jan 2019 21:59:06 +0200
Subject: [PATCH] Added optional parameters for outputting files and folders.

---
 sherlock.py | 87 ++++++++++++++++++++++++++---------------------------
 1 file changed, 43 insertions(+), 44 deletions(-)

diff --git a/sherlock.py b/sherlock.py
index 093594f..a05294f 100644
--- a/sherlock.py
+++ b/sherlock.py
@@ -67,18 +67,6 @@ class ElapsedFuturesSession(FuturesSession):
         return super(ElapsedFuturesSession, self).request(method, url, hooks=hooks, *args, **kwargs)
 
 
-def open_file(fname):
-    return open(fname, "a")
-
-
-def write_to_file(url, f):
-    f.write(url + "\n")
-
-
-def final_score(amount, f):
-    f.write("Total: "+str(amount) + "\n")
-
-
 def print_error(err, errstr, var, verbose=False):
     print(Style.BRIGHT + Fore.WHITE + "[" +
           Fore.RED + "-" +
@@ -151,14 +139,6 @@ def sherlock(username, site_data, verbose=False, tor=False, unique_tor=False, pr
                        there was an HTTP error when checking for existence.
     """
     global amount
-    fname = username.lower() + ".txt"
-
-    if os.path.isfile(fname):
-        os.remove(fname)
-        print((Style.BRIGHT + Fore.GREEN + "[" +
-               Fore.YELLOW + "*" +
-               Fore.GREEN + "] Removing previous file:" +
-               Fore.WHITE + " {}").format(fname))
 
     print((Style.BRIGHT + Fore.GREEN + "[" +
            Fore.YELLOW + "*" +
@@ -236,11 +216,11 @@ def sherlock(username, site_data, verbose=False, tor=False, unique_tor=False, pr
                 future = request_method(url=url, headers=headers,
                                         proxies=proxies,
                                         allow_redirects=allow_redirects
-                                       )
+                                        )
             else:
                 future = request_method(url=url, headers=headers,
                                         allow_redirects=allow_redirects
-                                       )
+                                        )
 
             # Store future in data for access later
             net_info["request_future"] = future
@@ -253,8 +233,6 @@ def sherlock(username, site_data, verbose=False, tor=False, unique_tor=False, pr
         results_total[social_network] = results_site
 
     # Open the file containing account links
-    f = open_file(fname)
-
     # Core logic: If tor requests, make them here. If multi-threaded requests, wait for responses
     for social_network, net_info in site_data.items():
 
@@ -297,7 +275,6 @@ def sherlock(username, site_data, verbose=False, tor=False, unique_tor=False, pr
             # Checks if the error message is in the HTML
             if not error in r.text:
                 print_found(social_network, url, response_time, verbose)
-                write_to_file(url, f)
                 exists = "yes"
                 amount = amount+1
             else:
@@ -308,7 +285,6 @@ def sherlock(username, site_data, verbose=False, tor=False, unique_tor=False, pr
             # Checks if the status code of the response is 2XX
             if not r.status_code >= 300 or r.status_code < 200:
                 print_found(social_network, url, response_time, verbose)
-                write_to_file(url, f)
                 exists = "yes"
                 amount = amount+1
             else:
@@ -324,7 +300,6 @@ def sherlock(username, site_data, verbose=False, tor=False, unique_tor=False, pr
             if (r.status_code >= 200) and (r.status_code < 300):
                 #
                 print_found(social_network, url, response_time, verbose)
-                write_to_file(url, f)
                 exists = "yes"
                 amount = amount+1
             else:
@@ -349,14 +324,6 @@ def sherlock(username, site_data, verbose=False, tor=False, unique_tor=False, pr
 
         # Add this site's results into final dictionary with all of the other results.
         results_total[social_network] = results_site
-
-    print((Style.BRIGHT + Fore.GREEN + "[" +
-           Fore.YELLOW + "*" +
-           Fore.GREEN + "] Saved: " +
-           Fore.WHITE + "{}").format(fname))
-
-    final_score(amount, f)
-    f.close()
     return results_total
 
 
@@ -379,9 +346,11 @@ def main():
                         action="store_true",  dest="verbose", default=False,
                         help="Display extra debugging information and metrics."
                         )
-    parser.add_argument("--quiet", "-q",
-                        action="store_false", dest="verbose",
-                        help="Disable debugging information (Default Option)."
+    parser.add_argument("--folderoutput", "-fo", dest="folderoutput",
+                        help="If using multiple usernames, the output of the results will be saved at this folder."
+                        )
+    parser.add_argument("--output", "-o", dest="output",
+                        help="If using single username, the output of the result will be saved at this file."
                         )
     parser.add_argument("--tor", "-t",
                         action="store_true", dest="tor", default=False,
@@ -427,26 +396,35 @@ def main():
         print("Using TOR to make requests")
         print("Warning: some websites might refuse connecting over TOR, so note that using this option might increase connection errors.")
 
+    # Check if both output methods are entered as input.
+    if args.output is not None and args.folderoutput is not None:
+        print("You can only use one of the output methods.")
+        sys.exit(1)
+
+    # Check validity for single username output.
+    if args.output is not None and len(args.username) != 1:
+        print("You can only use --output with a single username")
+        sys.exit(1)
+
     response_json_online = None
     site_data_all = None
 
     # Try to load json from website.
     try:
         response_json_online = requests.get(url=args.json_file)
-    except requests.exceptions.MissingSchema: # In case the schema is wrong it's because it may not be a website
+    except requests.exceptions.MissingSchema:  # In case the schema is wrong it's because it may not be a website
         pass
 
     # Check if the response is appropriate.
     if response_json_online is not None and response_json_online.status_code == 200:
         # Since we got data from a website, try to load json and exit if parsing fails.
-        try: 
+        try:
             site_data_all = response_json_online.json()
         except ValueError:
             print("Invalid JSON from website!")
             sys.exit(1)
             pass
 
-
     data_file_path = os.path.join(os.path.dirname(
         os.path.realpath(__file__)), args.json_file)
     # This will be none if the request had a missing schema
@@ -454,7 +432,8 @@ def main():
         # Check if the file exists otherwise exit.
         if not os.path.exists(data_file_path):
             print("JSON file at doesn't exist.")
-            print("If this is not a file but a website, make sure you have appended http:// or https://.")
+            print(
+                "If this is not a file but a website, make sure you have appended http:// or https://.")
             sys.exit(1)
         else:
             raw = open(data_file_path, "r", encoding="utf-8")
@@ -462,7 +441,7 @@ def main():
                 site_data_all = json.load(raw)
             except:
                 print("Invalid JSON loaded from file.")
-    
+
     if args.site_list is None:
         # Not desired to look at a sub-set of sites
         site_data = site_data_all
@@ -488,10 +467,30 @@ def main():
     # Run report on all specified users.
     for username in args.username:
         print()
+
+        if args.output:
+            file = open(args.output, "w", encoding="utf-8")
+        elif args.folderoutput:  # In case we handle multiple usernames at a targeted folder.
+            # If the folder doesn't exist, create it first.
+            if not os.path.isdir(args.folderoutput):
+                os.mkdir(args.folderoutput)
+            file = open(os.path.join(args.folderoutput,
+                                     username + ".txt"), "w", encoding="utf-8")
+        else:
+            file = open(username + ".txt", "w", encoding="utf-8")
         results = {}
         results = sherlock(username, site_data, verbose=args.verbose,
                            tor=args.tor, unique_tor=args.unique_tor, proxy=args.proxy)
 
+        exists_counter = 0
+        for website_name in results:
+            dictionary = results[website_name]
+            if dictionary.get("exists") == "yes":
+                exists_counter += 1
+                file.write(dictionary["url_user"] + "\n")
+        file.write("Total Websites : {}".format(exists_counter))
+        file.close()
+
         if args.csv == True:
             with open(username + ".csv", "w", newline='', encoding="utf-8") as csv_report:
                 writer = csv.writer(csv_report)
@@ -517,4 +516,4 @@ def main():
 
 
 if __name__ == "__main__":
-    main()
+    main()
\ No newline at end of file