# adstxtdetect.py
#
# Scans the .html files in the current working directory for the ads.txt
# keywords DIRECT and RESELLER and writes a per-file Y/N result to
# 000_Domains.txt.
import os
# Extension of the saved pages to inspect, the keywords whose presence marks a
# page as an ads.txt file, and the report written at the end of the run.
HTML_SUFFIX = '.html'
ADS_TXT_KEYWORDS = ('DIRECT', 'RESELLER')
OUTPUT_FILE = '000_Domains.txt'


def find_html_files(directory):
    """Return the names of the entries in *directory* that end in ``.html``.

    Only the suffix is tested, so names such as ``page.html.bak`` are skipped.
    The order is whatever ``os.listdir`` returns.
    """
    return [name for name in os.listdir(directory)
            if name.endswith(HTML_SUFFIX)]


def has_ads_txt_keyword(path):
    """Return True if any line of the file at *path* contains a keyword.

    Every line is examined, not just the first, so leading comments or blank
    lines do not hide a later DIRECT / RESELLER entry.  An empty file yields
    False.  Undecodable bytes are replaced rather than raising, because the
    keywords are plain ASCII and the rest of the content is irrelevant.
    """
    with open(path, encoding='utf-8', errors='replace') as f:
        return any(keyword in line
                   for line in f
                   for keyword in ADS_TXT_KEYWORDS)


def strip_html_suffix(filename):
    """Return *filename* without one trailing ``.html``, if it has one.

    Only the suffix is removed; a ``.html`` occurring elsewhere in the name
    (e.g. ``my.html5site.com.html``) is left intact.
    """
    if filename.endswith(HTML_SUFFIX):
        return filename[:-len(HTML_SUFFIX)]
    return filename


def result_line(filename, compliant):
    """Return the report line for *filename*: ``<name without .html>,Y|N``."""
    return strip_html_suffix(filename) + (',Y' if compliant else ',N')


# Collect the .html files found in the current working directory.
editFiles = find_html_files(os.getcwd())
print(editFiles)

# Classify each file by whether DIRECT or RESELLER appears anywhere in it.
AdsTxtPositive = []
for website in editFiles:
    compliant = has_ads_txt_keyword(website)
    if compliant:
        print(website)
    else:
        print(website + 'noncompliant')
    AdsTxtPositive.append(result_line(website, compliant))

# Write the report; the context manager guarantees the file is flushed/closed.
with open(OUTPUT_FILE, 'w') as woohoo:
    for item in AdsTxtPositive:
        woohoo.write("%s\n" % item)