-
Notifications
You must be signed in to change notification settings - Fork 1
/
Webscrap_IMDB_Test.py
39 lines (24 loc) · 1007 Bytes
/
Webscrap_IMDB_Test.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
""" Fortgeschrittene Softwaretechnik """
""" Teodor Chiaburu, 900526 """
""" Script for testing the class Webscraper """
# classes from the webscraping library
from Webscrap_IMDB_Library import Webscraper, TestWebscraper
if __name__ == '__main__':
    # Script entry point: scrape the IMDB chart page, turn the collected
    # data into a data frame, then run the TestWebscraper checks on it.
    # Everything lives under the guard so that importing this module does
    # not trigger any scraping.

    # define address of the site to be scraped
    top_url = "https://www.imdb.com/chart/moviemeter?sort=rk,asc&mode=simple&page=1"

    # instantiate webscraper for that address
    webscraper = Webscraper(top_url)

    # collect data: iterate_films receives the scraper's own add_films
    # method as the callback argument
    webscraper.iterate_films(webscraper.add_films)

    # convert the collected results to a data frame
    # NOTE(review): the previous comment said "save results as csv file",
    # but only the conversion is visible here -- confirm whether
    # convert_to_df() also writes a CSV as a side effect.
    df = webscraper.convert_to_df()

    ### TESTS ###

    # instantiate tester and add previously obtained data frame
    tester = TestWebscraper()
    tester.add_dataframe(df)

    # test dimensions (should be 100 rows by 5 columns)
    tester.test_shape()

    # test for NaN values
    tester.test_isnan()

    # check the starting index
    tester.test_start_index()