-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathUpdateShowData.py
36 lines (22 loc) · 983 Bytes
/
UpdateShowData.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
import gzip
import os
import shutil
import urllib.request

from GenerateShowData import *
def unzip(fileIn, fileOut):
    """Decompress the gzip archive at *fileIn* into the file *fileOut*.

    The archive is streamed through ``shutil.copyfileobj`` rather than being
    read into memory in one piece. *fileOut* is opened in ``'wb'`` mode, so
    an existing file at that path is overwritten.
    """
    with gzip.open(fileIn, 'rb') as compressed, open(fileOut, 'wb') as plain:
        shutil.copyfileobj(compressed, plain)
def updateData():
    """Download the three dataset archives, decompress them, and call getData().

    Steps, in order:

    1. Download the ratings, episode and title-basics ``.tsv.gz`` archives
       from ``datasets.imdbws.com`` into the ``tempData/`` directory
       (created here if it does not exist yet).
    2. Decompress them to ``ratings.csv``, ``dataFull.csv`` and
       ``showNames.csv`` in the current working directory. The content is
       copied unchanged from the ``.tsv`` archives; only the file name says
       ``.csv``.
    3. Call ``getData()`` (not defined in this file; presumably provided by
       the star import from ``GenerateShowData``).
    4. Delete the downloaded archives from ``tempData/``, whether or not the
       earlier steps succeeded.

    Raises:
        urllib.error.URLError: if a download fails.
        OSError: if a file cannot be written or an archive is not valid gzip.
    """
    tempDir = 'tempData'
    # (source URL, downloaded archive path, decompressed output path)
    dataSets = (
        ('https://datasets.imdbws.com/title.ratings.tsv.gz',
         'tempData/ratingsGet.tsv.gz', 'ratings.csv'),
        ('https://datasets.imdbws.com/title.episode.tsv.gz',
         'tempData/dataFullGet.tsv.gz', 'dataFull.csv'),
        ('https://datasets.imdbws.com/title.basics.tsv.gz',
         'tempData/showNamesGet.tsv.gz', 'showNames.csv'),
    )

    print("Updating Data Sets. This could take a while.")

    # urlretrieve does not create missing parent directories, so make sure
    # the download directory exists before the first request.
    os.makedirs(tempDir, exist_ok=True)

    try:
        # Fetch everything first, then decompress, so a failed download
        # leaves the previously extracted .csv files untouched.
        for url, archive, _ in dataSets:
            urllib.request.urlretrieve(url, archive)
        for _, archive, output in dataSets:
            unzip(archive, output)
        getData()
    finally:
        # Clean up temp files. Runs on failure too, so partial downloads do
        # not accumulate; an archive that was never created is skipped.
        for _, archive, _ in dataSets:
            try:
                os.remove(archive)
            except FileNotFoundError:
                pass
# Run the update right away. The call is not wrapped in an
# `if __name__ == "__main__":` guard, so it also runs when this module is imported.
updateData()