annotate service/reasoning/sse_collector.py @ 296:233b81cf2712

start sse_collector Ignore-this: eba53ef3b8b7b34089e018595c41d202
author drewp@bigasterisk.com
date Fri, 19 Aug 2016 10:54:38 -0700
parents
children 8d89da1915df
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
296
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
1 """
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
2 requesting /graph/foo returns an SSE patch stream that's the
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
3 result of fetching multiple other SSE patch streams. The result stream
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
4 may include new statements injected by this service.
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
5
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
6 Future:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
7 - filter out unneeded stmts from the sources
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
8 - give a time resolution and concatenate patches faster than that res
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
9 """
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
10
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
11 config = {
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
12 'streams': [
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
13 {'id': 'home',
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
14 'sources': [
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
15 #'http://bang:9059/graph/events',
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
16 'http://plus:9075/graph/events',
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
17 ]
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
18 },
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
19 ]
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
20 }
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
21
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
22 from crochet import no_setup
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
23 no_setup()
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
24
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
25 import sys, logging, weakref, traceback, json
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
26 from twisted.internet import reactor
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
27 import cyclone.web, cyclone.sse
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
28 from rdflib import ConjunctiveGraph
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
29 from rdflib.parser import StringInputSource
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
30 from docopt import docopt
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
31
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
32 from twisted_sse_demo.eventsource import EventSource
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
33
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
34 sys.path.append("../../lib")
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
35 from logsetup import log
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
36 from patchablegraph import patchAsJson
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
37
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
38 sys.path.append("/my/proj/light9")
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
39 from light9.rdfdb.patch import Patch
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
40
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
41 def patchFromJson(j):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
42 body = json.loads(j)['patch']
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
43 a = ConjunctiveGraph()
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
44 a.parse(StringInputSource(json.dumps(body['adds'])), format='json-ld')
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
45 d = ConjunctiveGraph()
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
46 d.parse(StringInputSource(json.dumps(body['deletes'])), format='json-ld')
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
47 return Patch(addGraph=a, delGraph=d)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
48
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
49 class PatchSource(object):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
50 """wrap EventSource so it emits Patch objects and has an explicit stop method"""
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
51 def __init__(self, url):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
52 self.url = url
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
53 self._listeners = set()#weakref.WeakSet()
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
54 log.info('start read from %s', url)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
55 self._eventSource = EventSource(url)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
56 self._eventSource.protocol.delimiter = '\n'
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
57
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
58 self._eventSource.addEventListener('fullGraph', self._onFullGraph)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
59 self._eventSource.addEventListener('patch', self._onMessage)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
60
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
61 def _onFullGraph(self, message):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
62 try:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
63 g = ConjunctiveGraph()
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
64 g.parse(StringInputSource(message), format='json-ld')
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
65 p = Patch(addGraph=g)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
66 self._sendPatch(p)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
67 except:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
68 traceback.print_exc()
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
69
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
70 def _onMessage(self, message):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
71 try:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
72 p = patchFromJson(message)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
73 self._sendPatch(p)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
74 except:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
75 traceback.print_exc()
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
76
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
77 def _sendPatch(self, p):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
78 log.info('output patch to %s listeners', p, len(self._listeners))
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
79 for lis in self._listeners:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
80 lis(p)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
81
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
82 def addPatchListener(self, func):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
83 self._listeners.add(func)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
84
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
85 def stop(self):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
86 log.info('stop read from %s', self.url)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
87 self._eventSource.protocol.stopProducing() #?
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
88 self._eventSource = None
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
89
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
90 def __del__(self):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
91 if self._eventSource:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
92 raise ValueError
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
93
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
94 class GraphClient(object):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
95 """A listener of some EventSources that sends patches to one of our clients."""
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
96
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
97 def __init__(self, handler, patchSources):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
98 self.handler = handler
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
99
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
100 for ps in patchSources:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
101 ps.addPatchListener(self.onPatch)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
102
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
103 def onPatch(self, p):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
104 self.handler.sendEvent(message=patchAsJson(p), event='patch')
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
105
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
106 class GraphClients(object):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
107 """All the active EventClient objects"""
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
108 def __init__(self):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
109 self.clients = {} # url: EventClient
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
110 self.listeners = {} # url: [GraphClient]
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
111
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
112 def addSseHandler(self, handler, streamId):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
113 log.info('addSseHandler %r %r', handler, streamId)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
114 matches = [s for s in config['streams'] if s['id'] == streamId]
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
115 if len(matches) != 1:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
116 raise ValueError("%s matches for %r" % (len(matches), streamId))
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
117 ecs = []
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
118 for source in matches[0]['sources']:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
119 if source not in self.clients:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
120 self.clients[source] = PatchSource(source)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
121 ecs.append(self.clients[source])
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
122
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
123 self.listeners.setdefault(source, []).append(GraphClient(handler, ecs))
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
124 print self.__dict__
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
125
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
126 def removeSseHandler(self, handler):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
127 log.info('removeSseHandler %r', handler)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
128 for url, graphClients in self.listeners.items():
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
129 keep = []
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
130 for gc in graphClients:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
131 if gc.handler != handler:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
132 keep.append(gc)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
133 graphClients[:] = keep
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
134 if not keep:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
135 self.clients[url].stop()
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
136 del self.clients[url]
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
137 del self.listeners[url]
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
138
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
139 class SomeGraph(cyclone.sse.SSEHandler):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
140 def __init__(self, application, request):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
141 cyclone.sse.SSEHandler.__init__(self, application, request)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
142 self.id = request.uri[len('/graph/'):]
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
143 self.graphClients = self.settings.graphClients
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
144
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
145 def bind(self):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
146 self.graphClients.addSseHandler(self, self.id)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
147
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
148 def unbind(self):
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
149 self.graphClients.removeSseHandler(self)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
150
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
151 if __name__ == '__main__':
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
152
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
153 arg = docopt("""
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
154 Usage: sse_collector.py [options]
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
155
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
156 -v Verbose
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
157 """)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
158
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
159 if arg['-v']:
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
160 import twisted.python.log
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
161 twisted.python.log.startLogging(sys.stdout)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
162 log.setLevel(logging.DEBUG)
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
163
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
164
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
165 graphClients = GraphClients()
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
166
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
167 reactor.listenTCP(
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
168 9071,
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
169 cyclone.web.Application(
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
170 handlers=[
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
171 (r'/graph/(.*)', SomeGraph),
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
172 ],
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
173 graphClients=graphClients),
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
174 interface='::')
233b81cf2712 start sse_collector
drewp@bigasterisk.com
parents:
diff changeset
175 reactor.run()