Skip to content

Commit 71b67b3

Browse files
Updated data_assembler.py [added PageSearch basic support]
1 parent c8d0d67 commit 71b67b3

File tree

1 file changed

+19
-4
lines changed

1 file changed

+19
-4
lines changed

datagather_modules/data_assembler.py

Lines changed: 19 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,10 +1,12 @@
11
from colorama import Fore, Style
22
import sys
33
sys.path.append('service')
4+
sys.path.append('pagesearch')
45

56
import crawl_processor as cp
67
import dorking_processor as dp
78
import networking_processor as np
9+
from pagesearch_main import normal_search
810

911
try:
1012
import requests
@@ -37,7 +39,7 @@ def report_preprocessing(self, short_domain, report_file_type):
3739
os.makedirs(report_folder, exist_ok=True)
3840
return casename, db_casename, db_creation_date, robots_filepath, sitemap_filepath, sitemap_links_filepath, report_file_type, report_folder, ctime
3941

40-
def data_gathering(self, short_domain, url, report_file_type):
42+
def data_gathering(self, short_domain, url, report_file_type, pagesearch_flag):
4143
casename, db_casename, db_creation_date, robots_filepath, sitemap_filepath, sitemap_links_filepath, report_file_type, report_folder, ctime = self.report_preprocessing(short_domain, report_file_type)
4244
print(Fore.GREEN + "Started scanning domain" + Style.RESET_ALL)
4345
print(Fore.GREEN + "Getting domain IP address" + Style.RESET_ALL)
@@ -83,22 +85,35 @@ def data_gathering(self, short_domain, url, report_file_type):
8385
for key in common_socials:
8486
common_socials[key] = list(set(common_socials[key]))
8587
total_socials = sum(len(values) for values in common_socials.values())
86-
8788
if report_file_type == 'pdf':
8889
data_array = [ip, res, mails, subdomains, subdomains_amount, social_medias, subdomain_mails, sd_socials,
8990
subdomain_ip, issuer, subject, notBefore, notAfter, commonName, serialNumber, mx_records,
9091
robots_txt_result, sitemap_xml_result, sitemap_links_status,
9192
web_servers, cms, programming_languages, web_frameworks, analytics, javascript_frameworks, ports,
9293
hostnames, cpes, tags, vulns, dorking_status, common_socials, total_socials]
94+
if pagesearch_flag.lower() == 'y':
95+
to_search_array = [subdomains, social_medias, sd_socials]
96+
print(Fore.LIGHTMAGENTA_EX + "\n[PAGESEARCH SUBPROCESS START]\n" + Style.RESET_ALL)
97+
normal_search(to_search_array, report_folder)
98+
print(Fore.LIGHTMAGENTA_EX + "\n[PAGESEARCH SUBPROCESS END]\n" + Style.RESET_ALL)
99+
#to_search_array = [subdomains, social_medias, sd_socials, sitemap_links_filepath] WIP
100+
elif pagesearch_flag.lower() == 'n':
101+
pass
93102
elif report_file_type == 'xlsx':
94103
data_array = [ip, res, mails, subdomains, subdomains_amount, social_medias, subdomain_mails, sd_socials,
95104
subdomain_ip, issuer, subject, notBefore, notAfter, commonName, serialNumber, mx_records,
96105
robots_txt_result, sitemap_xml_result, sitemap_links_status,
97106
web_servers, cms, programming_languages, web_frameworks, analytics, javascript_frameworks, ports,
98107
hostnames, cpes, tags, vulns, dorking_status, common_socials, total_socials, parsed_links, subdomain_urls, dorking_results]
108+
if pagesearch_flag.lower() == 'y':
109+
to_search_array = [subdomains, social_medias, sd_socials]
110+
print(Fore.LIGHTMAGENTA_EX + "\n[PAGESEARCH SUBPROCESS START]\n" + Style.RESET_ALL)
111+
normal_search(to_search_array, report_folder)
112+
print(Fore.LIGHTMAGENTA_EX + "\n[PAGESEARCH SUBPROCESS END]\n" + Style.RESET_ALL)
113+
#to_search_array = [subdomains, social_medias, sd_socials, sitemap_links_filepath] WIP
114+
elif pagesearch_flag.lower() == 'n':
115+
pass
99116

100117
report_info_array = [casename, db_casename, db_creation_date, report_folder, ctime, report_file_type]
101118

102119
return data_array, report_info_array
103-
104-

0 commit comments

Comments
 (0)