Mercurial > hg > svgsitemap
annotate svgsitemap/middleware.py @ 8:1d16bde33eee
take out some image too ::sigh::
author | Jeff Hammel <jhammel@mozilla.com> |
---|---|
date | Wed, 29 Dec 2010 00:25:48 -0800 |
parents | 145a4d85b37d |
children | aa4eab6dc994 |
rev | line source |
---|---|
0 | 1 """ |
2 request dispatcher | |
3 """ | |
4 | |
5 __all__ = ['MapserverMiddleware', 'SVGSiteMap'] | |
6 | |
7 import os | |
1 | 8 import urlparse |
6
a88a670c92d0
dont display things that you dont want
Jeff Hammel <jhammel@mozilla.com>
parents:
5
diff
changeset
|
9 from fnmatch import fnmatch |
0 | 10 from pygraphviz import AGraph |
1 | 11 from webob import Request, Response, exc |
0 | 12 |
class MapserverMiddleware(object):
    """WSGI middleware that serves a single SVG file from disk.

    A request whose ``PATH_INFO`` equals ``path`` is answered with the
    contents of ``svgmap`` as ``image/svg+xml``.  If ``path`` is empty,
    every request is answered that way.  All other requests are handed to
    the wrapped application untouched.
    """

    def __init__(self, app, svgmap, path='/map'):
        """
        - app: the wrapped WSGI application
        - svgmap: filesystem path of the SVG file to serve
        - path: URL path at which the SVG is served; a false value
          serves the SVG for every request
        """
        self.app = app
        self.svgmap = svgmap
        self.path = path

    def __call__(self, environ, start_response):
        """WSGI entry point: serve the SVG or delegate to the wrapped app."""
        request = Request(environ)

        # not the map URL: pass the request through
        if self.path and request.path_info != self.path:
            return self.app(environ, start_response)

        # the map has not been rendered (yet)
        if not os.path.exists(self.svgmap):
            res = exc.HTTPNotFound()
            return res(environ, start_response)

        # read as bytes and close the handle deterministically instead of
        # leaving it to the garbage collector
        with open(self.svgmap, 'rb') as svgfile:
            content = svgfile.read()
        res = Response(content_type='image/svg+xml', body=content)
        return res(environ, start_response)
0 | 30 |
31 | |
class SVGSiteMap(object):
    """WSGI middleware that records referer -> URL hits as a graphviz graph.

    Every request carrying a ``Referer`` header adds (or increments) a
    directed edge from the referring URL to the requested path.  The edge
    label holds the hit count and the edge width is scaled relative to the
    busiest edge.  After each change the graph is written to ``file`` and
    rendered to ``output`` with ``neato``.

    Configuration is passed as keyword arguments; see ``defaults`` for the
    recognized keys and their default values.
    """

    ### class level variables
    defaults = {'name': '',
                'hosts': '',
                'external_referers': True,
                'maxwidth': 5,
                'minwidth': '0.01',
                'maxlength': 80,
                'excluded': '*.css *.js */static/* /css/* *.ico /backgrounds/* *.png *.jpg',

                # input/output
                'file': None,  # graphviz file
                'output': None,  # .svg file

                # graph attributes
                'bgcolor': 'black',
                'fontcolor': 'white',
                'fontname': 'Helvetica',
                'fontsize': '10.0',
                'nodecolor': 'aqua',
                'edgecolor': 'lime',
                'shape': 'plaintext',
                'len': '1.3',
                'arrowsize': '0.5',
                }

    def __init__(self, app, **kw):
        """
        - app: the wrapped WSGI application
        - kw: configuration overrides for the keys in ``defaults``;
          ``file`` and ``output`` are required
        """

        # boilerplate
        self.app = app
        self.edges = {}  # (from_url, to_url) -> hit count
        self.max = 0  # highest hit count of any edge

        # set attrs from defaults
        for key in self.defaults:
            setattr(self, key, kw.get(key, self.defaults[key]))

        # sanity checks + data fixing
        assert self.output, "Please give an output file"
        assert self.file, "Cannot save file!"
        self.maxwidth = float(self.maxwidth)
        # configuration values may arrive as strings; comparing len(url)
        # with a string would silently never match on python 2
        self.maxlength = int(self.maxlength)
        if isinstance(self.excluded, basestring):
            self.excluded = self.excluded.split()
        else:
            self.excluded = list(self.excluded or [])
        # accept a whitespace-separated string or an already-split sequence
        if isinstance(self.hosts, basestring):
            self.hosts = self.hosts.split()
        else:
            self.hosts = list(self.hosts or [])
        if isinstance(self.external_referers, basestring):
            self.external_referers = self.external_referers.lower() == 'true'

        # open the graph
        if os.path.exists(self.file):
            self.graph = AGraph(self.file, name=self.name, splines=False, directed=True)

            # reload the hit counts, dropping edges that are now excluded
            for edge in self.graph.edges():
                if self.exclude(edge[0], edge[1]):
                    self.graph.remove_edge(edge[0], edge[1])
                    continue
                count = int(edge.attr['label'])
                self.edges[(edge[0], edge[1])] = count
                if count > self.max:
                    self.max = count

            # drop nodes that are excluded or no longer connected
            for node in self.graph.nodes():
                if not self.graph.neighbors(node) or self.exclude(node):
                    self.graph.remove_node(node)

            self.set_widths()
            self.graph.write(self.file)
            self.graph.draw(self.output, prog='neato')
        else:
            self.graph = AGraph(name=self.name, splines=False, directed=True)

        # make it pretty
        self.graph.graph_attr['name'] = self.name
        self.graph.graph_attr['label'] = self.name
        self.graph.graph_attr['fontname'] = self.fontname
        self.graph.graph_attr['fontcolor'] = self.fontcolor
        self.graph.graph_attr['bgcolor'] = self.bgcolor
        self.graph.node_attr['color'] = self.nodecolor
        self.graph.node_attr['fontcolor'] = self.fontcolor
        self.graph.node_attr['fontname'] = self.fontname
        self.graph.node_attr['fontsize'] = self.fontsize
        self.graph.node_attr['shape'] = self.shape
        self.graph.node_attr['width'] = '0.1'
        self.graph.node_attr['height'] = '0.1'
        self.graph.edge_attr['color'] = self.edgecolor
        self.graph.edge_attr['fontcolor'] = self.fontcolor
        self.graph.edge_attr['fontname'] = self.fontname
        self.graph.edge_attr['fontsize'] = self.fontsize
        self.graph.edge_attr['len'] = self.len
        self.graph.edge_attr['arrowsize'] = self.arrowsize

    def __call__(self, environ, start_response):
        """WSGI entry point: record the referer link, then delegate."""
        request = Request(environ)
        if request.referer:

            # parse the URLs
            parsed_referer = urlparse.urlsplit(request.referer)
            parsed_referee = urlparse.urlsplit(request.url)

            # the Referer header is client-supplied; hostname is None when
            # it is relative or malformed, which must not break the request
            referer_host = parsed_referer.hostname or ''

            # see if its local or not
            localhosts = [host for host in self.hosts if host]
            own_host = parsed_referee.hostname
            if own_host and own_host not in localhosts:
                localhosts.append(own_host)
            islocal = any(referer_host == host or
                          referer_host.endswith('.' + host)
                          for host in localhosts)

            # make the connection
            if islocal:
                self.add(parsed_referer.path, parsed_referee.path)
            elif self.external_referers:
                self.add(request.referer, parsed_referee.path)

        return self.app(environ, start_response)

    def add(self, from_url, to_url):
        """add a connection in the graph

        Increments the hit count of the ``from_url`` -> ``to_url`` edge,
        creating it if needed, then rewrites the graph file and the
        rendered output.  Self-references and excluded URLs are ignored.
        """

        if from_url == to_url:
            return  # don't do self-references
        if self.exclude(from_url, to_url):
            return  # ignore certain urls

        key = (from_url, to_url)
        if key in self.edges:
            count = self.edges[key] + 1
            self.edges[key] = count
            edge = self.graph.get_edge(from_url, to_url)
            edge.attr['label'] = str(count)
        else:
            count = 1
            self.edges[key] = count
            self.graph.add_edge(from_url, to_url, label='1')

        # keep the running maximum; a new edge must never reset it, or the
        # widths of busier edges would exceed maxwidth
        if count > self.max:
            self.max = count

        if self.maxwidth:
            self.set_widths()

        for url in from_url, to_url:
            node = self.graph.get_node(url)
            node.attr['label'] = url
            node.attr['href'] = url

        if self.file:
            self.graph.write(self.file)
        if self.output:
            self.graph.draw(self.output, prog='neato')

    def exclude(self, *urls):
        """tell whether the edge is excluded

        Returns True if any of ``urls`` matches one of the ``excluded``
        fnmatch patterns or is longer than ``maxlength``; False otherwise.
        """
        for url in urls:
            if len(url) > self.maxlength:
                return True
            if any(fnmatch(url, pattern) for pattern in self.excluded):
                return True
        return False

    def set_widths(self):
        """scale each edge's line width by its share of the highest count

        With a false ``maxwidth`` the edge styles are cleared instead.
        """
        edges = self.graph.edges()

        if not self.maxwidth:
            for edge in edges:
                edge.attr['style'] = ''
            return

        # guard against dividing by zero before any hit has been counted
        highest = self.max or 1
        for edge in edges:
            count = self.edges[(edge[0], edge[1])]
            width = self.maxwidth * count / highest
            if not width:
                width = self.minwidth
            edge.attr['style'] = 'setlinewidth(%s)' % width