-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathrouteUtils.py
104 lines (83 loc) · 3.56 KB
/
routeUtils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
#!/usr/bin/env python3
import re
import random
from resty import restDriver
from routing import RouterManager
ipPortRegCompile = re.compile('(.+):([^:]+)$', re.UNICODE)
class Router:
def __init__(self, addrList, hashBase=10):
self.__addrList = addrList
self.__addrToDriverMap = {}
self.initAddrMapping(addrList, hashBase)
def initAddrMapping(self, addrList, hashBase=10):
self.__routeManager = RouterManager.RouterManager(hashBase=hashBase, serverAddrList=addrList)
routeMapList = self.__routeManager.getRoutingAddresses()
for addr in routeMapList:
# Build WorkerManagers
ipPortSearch = ipPortRegCompile.search(addr)
if ipPortSearch:
target = ipPortSearch.groups(1)
wD = WorkerDriver(*target)
self.__addrToDriverMap[addr] = wD
def getWorkerDriver(self, item):
associatedAddr = self.__routeManager.getRoute(item.__hash__())
return self.__addrToDriverMap.get(associatedAddr, None)
class WorkerDriver:
def __init__(self, ip, port):
self.__workerId = -1
self.getDefaultAuthor = restDriver.getDefaultAuthor
print('ip', ip, 'port', port)
self.initMainRestDriver(ip, port)
self.initWorker()
self.initRouting()
def initMainRestDriver(self, ip, port):
self.restDriver = restDriver.RestDriver(ip, port)
wHandler = self.restDriver.registerLiason('Worker', '/jobTable/workerHandler')
assert(wHandler)
jHandler = self.restDriver.registerLiason('Job', '/jobTable/jobHandler')
assert(jHandler)
rHandler = self.restDriver.registerLiason('Route', '/jobTable/routeHandler')
assert(rHandler)
def initRouting(self):
baseUrl = self.restDriver.getBaseUrl()
rResponse = self.restDriver.getRoutes(address=baseUrl)
value = rResponse.get('value', {})
if rResponse.get('status_code', 400) == 200 and value.get('data', None):
print('Already registered', baseUrl)
else:
cResponse = self.restDriver.newRoute(
address=self.restDriver.getBaseUrl()
)
print('After logging the route', cResponse)
# Let's now get the list of all present routes
routeManifest = self.restDriver.getRoutes(select='address')
if routeManifest.get('status_code', 400) == 200:
data = routeManifest.get('data', None) or []
addrList = []
for item in data:
addr = item.get('address', None)
if addr:
addrList.append(addr)
# print('addrList', addrList)
def getWorkerId(self):
return self.__workerId
def initWorker(self):
workerCheck = self.restDriver.getWorkers(
purpose='Crawling', select='id', format='short'
).get('value', {})
if workerCheck.get('data', None):
workersPresent = workerCheck['data']
randWorkerId = random.sample(workersPresent, 1)[0].get('id', -1)
self.__workerId = randWorkerId
print('Present workers: {wp} randPickedWorker: {rw}'.format(
wp=workersPresent, rw=randWorkerId)
)
else:
nwResp = self.restDriver.newWorker(purpose='Crawling').get('value', {})
print('nwResp', nwResp)
self.__workerId = nwResp.get('data', {'id': -1}).get('id', -1)
print('Initialized WorkerId: ', self.__workerId)
def main():
pass
if __name__ == '__main__':
main()