-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathutils.py
More file actions
52 lines (42 loc) · 1.36 KB
/
utils.py
File metadata and controls
52 lines (42 loc) · 1.36 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
from json import dumps, loads
from inspect import getmembers, isclass
from scrapy.http.request import Request
from scrapy.http.response import Response
import items
def deserializeLine(line):
    """Decode one JSON line into Scrapy requests and/or items.

    ``line`` must hold either a single JSON object or a JSON list of
    objects, each carrying a ``'type'`` key.

    * If the first object has type ``'spider_settings'`` it is returned
      unchanged (as a dict) and any remaining objects are ignored.
    * ``'request'`` objects become ``Request`` instances built from
      ``'url'``; their ``'meta'`` mapping is merged into ``request.meta``
      and the ``'callback'`` value is stored in ``request.meta['callback']``.
    * ``'item'`` objects are converted with ``dictToItem`` from their
      ``'item'`` payload and ``'name'``.
    * Objects of any other type are skipped.

    Returns:
        The single converted object when exactly one was produced,
        otherwise the list of converted objects (possibly empty).

    Raises:
        ValueError: if ``line`` is not valid JSON (raised by ``loads``).
        KeyError: if an object lacks a key required for its type.
    """
    obj = loads(line)
    if not isinstance(obj, list):
        obj = [obj]

    # An empty JSON list has no first element to inspect; skip the check so
    # the function returns an empty list instead of raising IndexError.
    if obj and obj[0]['type'] == 'spider_settings':
        return obj[0]

    lister = []
    for element in obj:
        kind = element['type']
        if kind == 'request':
            request = Request(element['url'])
            request.meta.update(element['meta'])
            request.meta['callback'] = element['callback']
            lister.append(request)
        elif kind == 'item':
            lister.append(dictToItem(element['item'], element['name']))

    # Compare by value: ``is`` tests object identity and only happened to
    # work for small integers as a CPython implementation detail.
    if len(lister) == 1:
        return lister[0]
    return lister
# Lazily-built cache mapping class name -> class for every class that is
# visible as a member of the ``items`` module.
ItemDict = {}


def dictToItem(d, name):
    """Instantiate the ``items`` class called ``name`` from the dict ``d``.

    On the first call (while the cache is still empty) the module-level
    ``ItemDict`` is rebound to a name -> class mapping of all classes found
    in the ``items`` module. Later calls reuse that mapping.

    Raises:
        KeyError: if no class named ``name`` is present in the mapping.
    """
    global ItemDict
    if not ItemDict:
        # ``getmembers`` with a predicate returns (name, value) pairs for
        # the members accepted by the predicate, which ``dict`` consumes.
        ItemDict = dict(getmembers(items, isclass))
    item_class = ItemDict[name]
    return item_class(d)
def serializeObject(obj):
    """Serialize a Scrapy ``Response`` into a JSON string.

    The encoded object has four keys, in this order:

    * ``'url'``      -- ``obj.url``
    * ``'body'``     -- ``obj.body``
    * ``'callback'`` -- ``obj.meta['callback']`` when present, otherwise
      the string ``'parse'``
    * ``'meta'``     -- ``obj.meta``

    Returns:
        The JSON text produced by ``dumps``, or ``None`` when ``obj`` is
        not a ``Response``.
    """
    if not isinstance(obj, Response):
        # Only responses are handled; other objects produce no output.
        return None

    payload = {
        'url': obj.url,
        'body': obj.body,
        'callback': obj.meta.get('callback', 'parse'),
        'meta': obj.meta,
    }
    return dumps(payload)