From d6a73f2b37f500f6c7fdbbd918e2a401109598b3 Mon Sep 17 00:00:00 2001 From: Helmut Grohne Date: Mon, 4 Mar 2013 13:49:22 +0100 Subject: webapp: generate /comparison pages in constant-space --- webapp.py | 46 +++++++++++++++++++++++++++------------------- 1 file changed, 27 insertions(+), 19 deletions(-) (limited to 'webapp.py') diff --git a/webapp.py b/webapp.py index 4a586dd..1f19891 100755 --- a/webapp.py +++ b/webapp.py @@ -69,17 +69,15 @@ detail_template = jinjaenv.from_string( {% block title %}sharing between {{ details1.package|e }} and {{ details2.package|e }}{% endblock%} {% block content %}

{{ details1.package|e }} <-> {{ details2.package|e }}

-{%- if shared -%} - {%- for entry in shared|sort(attribute="size1", reverse=true) -%} + {%- for entry in shared -%} {%- endfor -%}
{{ details1.package|e }} | {{ details2.package|e }}
size | filename | hash functions | size | filename | hash functions
{{ entry.size1|format_size }}{{ entry.filename1 }} {%- for funccomb, hashvalue in entry.functions.items() %}{{ funccomb[0]|e }} {% endfor %} {{ entry.size2|format_size }}{{ entry.filename2 }} {%- for funccomb, hashvalue in entry.functions.items() %}{{ funccomb[1]|e }} {% endfor %}
-{%- endif -%} {% endblock %}""") hash_template = jinjaenv.from_string( @@ -158,6 +156,27 @@ def html_response(unicode_iterator, max_age=24 * 60 * 60): resp.expires = datetime.datetime.now() + datetime.timedelta(seconds=max_age) return resp +def generate_shared(rows): + """internal helper from show_detail""" + entry = None + for filename1, size1, func1, filename2, size2, func2, hashvalue in rows: + funccomb = (func1, func2) + if funccomb not in hash_functions: + continue + if entry and (entry["filename1"] != filename1 or + entry["filename2"] != filename2): + yield entry + entry = None + if entry: + funcdict = entry["functions"] + else: + funcdict = dict() + entry = dict(filename1=filename1, filename2=filename2, size1=size1, + size2=size2, functions=funcdict) + funcdict[funccomb] = hashvalue + if entry: + yield entry + class Application(object): def __init__(self, db): self.db = db @@ -248,32 +267,21 @@ class Application(object): if package1 == package2: details1 = details2 = self.get_details(package1) - cur.execute("SELECT a.filename, a.size, a.function, b.filename, b.size, b.function, a.hash FROM content AS a JOIN content AS b ON a.hash = b.hash WHERE a.package = ? AND b.package = ? AND a.filename != b.filename;", + cur.execute("SELECT a.filename, a.size, a.function, b.filename, b.size, b.function, a.hash FROM content AS a JOIN content AS b ON a.hash = b.hash WHERE a.package = ? AND b.package = ? AND a.filename != b.filename ORDER BY a.size DESC, a.filename, b.filename;", (package1, package1)) else: details1 = self.get_details(package1) details2 = self.get_details(package2) - cur.execute("SELECT a.filename, a.size, a.function, b.filename, b.size, b.function, a.hash FROM content AS a JOIN content AS b ON a.hash = b.hash WHERE a.package = ? AND b.package = ?;", + cur.execute("SELECT a.filename, a.size, a.function, b.filename, b.size, b.function, a.hash FROM content AS a JOIN content AS b ON a.hash = b.hash WHERE a.package = ? AND b.package = ? 
ORDER BY a.size DESC, a.filename, b.filename;", (package1, package2)) - - shared = dict() - for filename1, size1, func1, filename2, size2, func2, hashvalue in fetchiter(cur): - funccomb = (func1, func2) - if funccomb not in hash_functions: - continue - funcdict = shared.setdefault((filename1, filename2), - (size1, size2, dict()))[2] - funcdict[(func1, func2)] = hashvalue - shared = [dict(filename1=filename1, filename2=filename2, size1=size1, - size2=size2, functions=functions) - for (filename1, filename2), (size1, size2, functions) - in shared.items()] + shared = generate_shared(fetchiter(cur)) + # The cursor will be in use until the template is fully rendered. params = dict( details1=details1, details2=details2, shared=shared) - return html_response(detail_template.render(params)) + return html_response(detail_template.stream(params)) def show_hash(self, function, hashvalue): cur = self.db.cursor() -- cgit v1.2.3