2015-07-17 23:44:26 +00:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
|
|
|
|
import os
|
2015-07-18 03:49:24 +00:00
|
|
|
import json
|
2015-07-18 05:35:57 +00:00
|
|
|
import pprint
|
2015-07-18 03:17:27 +00:00
|
|
|
# Can't use trollius because then onConnect never gets called
|
2015-07-18 03:33:57 +00:00
|
|
|
# https://github.com/tavendo/AutobahnPython/issues/426
|
2015-07-17 23:44:26 +00:00
|
|
|
import asyncio
|
|
|
|
from autobahn.asyncio.websocket import WebSocketServerFactory, WebSocketServerProtocol
|
|
|
|
|
2015-07-18 10:57:57 +00:00
|
|
|
class GrabberServerProtocol(WebSocketServerProtocol):
|
2015-07-18 02:11:18 +00:00
|
|
|
def __init__(self):
|
|
|
|
super().__init__()
|
2015-07-18 13:29:19 +00:00
|
|
|
self.mode = None
|
2015-07-18 02:11:18 +00:00
|
|
|
|
2015-07-17 23:44:26 +00:00
|
|
|
def onConnect(self, request):
|
2015-07-18 02:11:18 +00:00
|
|
|
self.peer = request.peer
|
2015-07-18 08:26:58 +00:00
|
|
|
print("{} connected".format(self.peer))
|
2015-07-18 02:11:18 +00:00
|
|
|
self.factory.clients.add(self)
|
|
|
|
|
|
|
|
def onClose(self, wasClean, code, reason):
|
2015-07-18 08:26:58 +00:00
|
|
|
print("{} disconnected".format(self.peer))
|
2016-02-24 16:03:34 -06:00
|
|
|
self.factory.clients.discard(self)
|
2015-07-18 02:11:18 +00:00
|
|
|
|
2015-07-18 05:24:54 +00:00
|
|
|
def broadcastToDashboards(self, obj):
|
|
|
|
for client in self.factory.clients:
|
|
|
|
if client.mode == "dashboard":
|
2015-07-18 05:35:57 +00:00
|
|
|
##print("Broadcasting", pprint.pformat(obj))
|
2015-07-18 05:24:54 +00:00
|
|
|
client.sendMessage(json.dumps(obj).encode("utf-8"))
|
|
|
|
|
2015-07-18 02:11:18 +00:00
|
|
|
def onMessage(self, payload, isBinary):
|
2015-07-18 05:24:54 +00:00
|
|
|
##print(payload)
|
2015-07-18 02:11:18 +00:00
|
|
|
obj = json.loads(payload.decode('utf-8'))
|
|
|
|
type = obj["type"]
|
2015-07-18 13:32:26 +00:00
|
|
|
if self.mode is None and type == "hello" and obj.get("mode"):
|
2015-07-18 02:11:18 +00:00
|
|
|
mode = obj['mode']
|
|
|
|
if mode in ('dashboard', 'grabber'):
|
2015-07-18 13:29:19 +00:00
|
|
|
self.mode = mode
|
2015-07-18 08:26:58 +00:00
|
|
|
if mode == "grabber":
|
|
|
|
print("{} is grabbing {}".format(self.peer, obj['url']))
|
2015-07-18 13:29:19 +00:00
|
|
|
elif mode == "dashboard":
|
|
|
|
print("{} is dashboarding with {}".format(self.peer, obj['user_agent']))
|
2015-07-18 13:35:11 +00:00
|
|
|
elif self.mode == "grabber":
|
|
|
|
if type == "download":
|
|
|
|
self.broadcastToDashboards({
|
|
|
|
"type": type,
|
|
|
|
"job_data": obj["job_data"],
|
|
|
|
"url": obj["url"],
|
|
|
|
"response_code": obj["response_code"],
|
|
|
|
"wget_code": obj["response_message"]
|
|
|
|
})
|
|
|
|
elif type in ("stdout", "stderr"):
|
|
|
|
self.broadcastToDashboards({
|
|
|
|
"type": type,
|
|
|
|
"job_data": obj["job_data"],
|
|
|
|
"message": obj["message"]
|
|
|
|
})
|
|
|
|
elif type == "ignore":
|
|
|
|
self.broadcastToDashboards({
|
|
|
|
"type": type,
|
|
|
|
"job_data": obj["job_data"],
|
|
|
|
"url": obj["url"],
|
|
|
|
"pattern": obj["pattern"],
|
|
|
|
})
|
2015-07-17 23:44:26 +00:00
|
|
|
|
2016-02-24 16:44:13 -06:00
|
|
|
# Called when we get an HTTP request instead of a WebSocket request
|
2016-02-24 16:03:34 -06:00
|
|
|
def sendServerStatus(self, redirectUrl=None, redirectAfter=0):
|
|
|
|
requestPath = self.http_request_uri.split("?")[0]
|
|
|
|
if requestPath == "/":
|
|
|
|
with open(os.path.join(os.path.dirname(__file__), "dashboard.html"), "r") as f:
|
|
|
|
dashboardHtml = f.read()
|
|
|
|
self.sendHtml(dashboardHtml)
|
|
|
|
else:
|
2016-02-24 16:44:13 -06:00
|
|
|
self.send404()
|
2016-02-24 16:03:34 -06:00
|
|
|
|
|
|
|
def send404(self):
|
|
|
|
with open(os.path.join(os.path.dirname(__file__), "404.html"), "r") as f:
|
|
|
|
responseHtml = f.read()
|
|
|
|
response = "HTTP/1.1 404 Not Found\x0d\x0a"
|
|
|
|
response += "Content-Type: text/html; charset=UTF-8\x0d\x0a"
|
2016-02-24 16:44:13 -06:00
|
|
|
response += "Content-Length: {}\x0d\x0a".format(len(responseHtml))
|
2016-02-24 16:03:34 -06:00
|
|
|
response += "\x0d\x0a"
|
|
|
|
response += responseHtml
|
|
|
|
self.sendData(response.encode("utf_8"))
|
2015-07-17 23:44:26 +00:00
|
|
|
|
2015-07-18 10:57:57 +00:00
|
|
|
class GrabberServerFactory(WebSocketServerFactory):
|
|
|
|
protocol = GrabberServerProtocol
|
2015-07-18 02:11:18 +00:00
|
|
|
|
|
|
|
def __init__(self):
|
|
|
|
super().__init__()
|
|
|
|
self.clients = set()
|
|
|
|
|
|
|
|
|
2015-07-17 23:44:26 +00:00
|
|
|
def main():
|
|
|
|
loop = asyncio.get_event_loop()
|
|
|
|
|
2016-02-24 16:03:34 -06:00
|
|
|
port = int(os.environ.get('GRAB_SITE_PORT', 29000))
|
|
|
|
interface = os.environ.get('GRAB_SITE_INTERFACE', '0.0.0.0')
|
2015-07-17 23:44:26 +00:00
|
|
|
|
2016-02-24 16:03:34 -06:00
|
|
|
factory = GrabberServerFactory()
|
|
|
|
coro = loop.create_server(factory, interface, port)
|
|
|
|
loop.run_until_complete(coro)
|
2015-07-17 23:44:26 +00:00
|
|
|
|
2016-02-24 16:03:34 -06:00
|
|
|
print("grab-site server started on {}:{}".format(interface, port))
|
2015-07-17 23:44:26 +00:00
|
|
|
|
|
|
|
loop.run_forever()
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == '__main__':
|
|
|
|
main()
|