-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmaoyan_info.py
executable file
·42 lines (40 loc) · 1.38 KB
/
maoyan_info.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
#!/usr/bin/env python
# encoding: utf-8
import os
import urllib2
import json
import csv
# Column names of the output CSV, in write order. Each name is also the key
# looked up in every movie record of the JSON payload.
rowName = [
    u'category',
    u'drama',
    u'name',
    u'image',
    u'stars',
    u'director',
    u'wishNum',
    u'score',
    u'version',
    u'scoreNum',
    u'duration',
    u'id',
    u'releaseTime',
]
def dataprocess(html, fileName='/home/lxz/python/maoyan/maoyan_info.csv'):
    """Append the movie records found in a JSON payload to a CSV file.

    The payload is parsed with ``json.loads`` and every entry of its
    ``"data"`` list becomes one CSV row whose columns follow ``rowName``.
    A header row is written only when the target file does not exist yet;
    otherwise the rows are appended to the existing file.

    Args:
        html: JSON text whose top-level object holds a ``"data"`` list of
            dicts, each containing every key listed in ``rowName``.
        fileName: Path of the CSV file to create or append to. Defaults to
            the path this script has always written to.

    Raises:
        ValueError: If ``html`` is not valid JSON.
        KeyError: If ``"data"`` or one of the ``rowName`` keys is missing.
    """
    content = json.loads(html)
    # Decide before opening: creating the file means a header is needed.
    is_new_file = not os.path.exists(fileName)
    mode = 'wb' if is_new_file else 'ab'
    # ``with`` closes the file even when a record fails half-way through.
    with open(fileName, mode) as csvfile:
        writer = csv.writer(csvfile)
        if is_new_file:
            writer.writerow([name.encode('utf8') for name in rowName])
        for record in content["data"]:
            # u'{0}'.format(...) turns any value into text without the
            # implicit ASCII encode that str() applies to unicode objects,
            # which raised UnicodeEncodeError for non-ASCII field values.
            writer.writerow(
                [u'{0}'.format(record[key]).encode('utf8') for key in rowName]
            )
def main():
    """Fetch base info for every movie ID listed in maoyan.csv.

    The second comma-separated column of each input line is taken as a
    movie ID. The ``movieId`` header value, empty IDs and IDs already
    handled during this run are skipped. For every remaining ID the JSON
    document is downloaded from piaofang.maoyan.com and passed to
    ``dataprocess``; the ID is then printed as progress output.

    Network and parsing errors are not caught and abort the run.
    """
    seen = set()  # IDs already fetched; a set keeps duplicate checks O(1)
    with open('/home/lxz/python/maoyan/maoyan.csv') as source:
        for line in source:
            columns = line.rstrip('\r\n').split(',')
            if len(columns) < 2:
                # Blank or malformed line: there is no ID column to read.
                continue
            # Strip so an ID sitting in the last column does not carry
            # whitespace or a line ending into the request URL.
            ID = columns[1].strip()
            if not ID or ID == 'movieId' or ID in seen:
                continue
            url = 'http://piaofang.maoyan.com/movie/baseinfo.json?movie=' + ID
            response = urllib2.urlopen(url, timeout=5)
            try:
                html = response.read()
            finally:
                # Release the connection even if reading fails.
                response.close()
            dataprocess(html)
            print(ID)
            seen.add(ID)
# Run the scraper only when this file is executed directly, not on import.
if __name__ == "__main__":
    main()