forked from kokopi-dev/hipposcraper
-
Notifications
You must be signed in to change notification settings - Fork 0
/
test_file_scraper.py
executable file
·79 lines (73 loc) · 3.25 KB
/
test_file_scraper.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
#!/usr/bin/env python2
"""Module for TestFileScraper"""
from scrapers import *
class TestFileScraper:
    """Scrape example test files out of a parsed project page.

    Every ``<pre>`` element of the page is collected on construction.
    ``write_test_files`` then looks for shell transcripts of the form
    ``<prompt>$ cat <file>`` and writes the listing that follows the
    command to ``<file>`` in the current working directory.

    Args:
        soup (obj): BeautifulSoup obj containing parsed link

    Attributes:
        soup (obj): the parsed page handed to the constructor
        pre (list): result of ``soup.select("pre")``
    """

    def __init__(self, soup):
        """Store `soup` and collect its ``<pre>`` elements."""
        self.soup = soup
        self.pre = self.find_test_files()

    def find_test_files(self):
        """Return every ``<pre>`` element selected from the page."""
        return self.soup.select("pre")

    def write_test_files(self):
        """Write one file per ``cat <file>`` transcript found in `self.pre`.

        A ``<pre>`` element is considered only when its text contains
        ``cat`` together with ``main.c``, ``.py``, ``.sql``, ``.js`` or
        ``.html``.  The text before the first ``$`` is taken as the shell
        prompt; the file body is whatever sits between the line holding
        the ``cat`` command and the next occurrence of that prompt.

        Progress and per-file errors are reported on stdout.  Elements
        that cannot be parsed or written are skipped, never fatal.
        """
        # Local import so the block does not depend on what the module's
        # star import happens to expose.
        import io

        sys.stdout.write(" -> Creating test files... ")
        for item in self.pre:
            content = item.text
            is_c = "main.c" in content
            is_py = ".py" in content
            is_sql = ".sql" in content
            is_js = ".js" in content
            is_html = ".html" in content

            # Only transcripts that `cat` a recognised file type qualify.
            if "cat" not in content:
                continue
            if not (is_c or is_py or is_sql or is_js or is_html):
                continue

            # Bound before the try so the error report below never reads
            # an unassigned (or stale, from a previous element) name.
            name = "[Not a test file]"
            try:
                user = content.split("$", 1)[0]
                name = content.split("cat ", 1)[1]
                if is_c:
                    name = name.split(".c", 1)[0] + ".c"
                elif is_sql:
                    name = name.split(".sql", 1)[0] + ".sql"
                elif is_js:
                    name = name.split(".js", 1)[0] + ".js"
                else:
                    name = name.split(".py", 1)[0] + ".py"

                if is_html:
                    # html edge case: the page itself may mention .js or
                    # .py, so the name is re-derived from ".html" and the
                    # body is kept verbatim minus its final character
                    # (the newline that precedes the next prompt).
                    text = content.split(".html")[1]
                    text = text.split(user, 1)[0]
                    text = text.split("\n", 1)[1]
                    name = name.split(".html", 1)[0] + ".html"
                    body = text[:-1]
                else:
                    text = content.split(name, 1)[1]
                    text = text.split("\n", 1)[1]
                    text = text.split(user, 1)[0]
                    # The last piece is the remainder after the final
                    # newline, not a line of the file, so it is dropped.
                    lines = text.split("\n")[:-1]
                    body = u"".join(line + u"\n" for line in lines)

                # Text-mode UTF-8 file: encoding happens once, here, and
                # the handle is closed even if the write fails.
                # NOTE(review): assumes item.text is unicode text, as
                # BeautifulSoup provides -- confirm for other callers.
                with io.open(name, "w", encoding="utf-8") as test_file:
                    test_file.write(body)
            except (AttributeError, IndexError, ValueError):
                # ValueError covers an empty prompt (text starting with
                # "$"), which makes split(user, 1) reject its separator.
                # A "name" with two or more newlines before its last
                # character is a chunk of page text, not a file name.
                if name[:-1].count("\n") > 1:
                    name = "[Not a test file]"
                sys.stdout.write("[ERROR] Could not create ")
                sys.stdout.write("test file %s\n" % name)
                sys.stdout.write(" ... ")
            except IOError:
                sys.stdout.write("\n [ERROR] Could not create a specific test file.\n")
        print("done")