summary | refs | log | tree | commit | diff
path: root/update_sharing.py
diff options
context:
space:
mode:
author Helmut Grohne <helmut@subdivi.de> 2013-07-25 13:28:19 +0200
committer Helmut Grohne <helmut@subdivi.de> 2013-07-25 13:28:19 +0200
commit 9b653583711c59d96c45af43ff8ee9534500adb6 (patch)
tree aca58a607a571f1f46294e2cfa4f20ce06746771 /update_sharing.py
parent 796eeb217e449234b777512451c5b668837c9118 (diff)
download debian-dedup-9b653583711c59d96c45af43ff8ee9534500adb6.tar.gz
display "issues" with files in package view
Currently the reported issues are files named .gz that are not valid gzip files and PNG images whose names do not end in .png.
Diffstat (limited to 'update_sharing.py')
-rwxr-xr-x update_sharing.py 3
1 files changed, 3 insertions, 0 deletions
diff --git a/update_sharing.py b/update_sharing.py
index 55e8096..62a3ab5 100755
--- a/update_sharing.py
+++ b/update_sharing.py
@@ -43,6 +43,7 @@ def main():
cur.execute("PRAGMA foreign_keys = ON;")
cur.execute("DELETE FROM sharing;")
cur.execute("DELETE FROM duplicate;")
+ cur.execute("DELETE FROM issue;")
readcur = db.cursor()
readcur.execute("SELECT hash FROM hash GROUP BY hash HAVING count(*) > 1;")
for hashvalue, in fetchiter(readcur):
@@ -54,6 +55,8 @@ def main():
cur.executemany("INSERT OR IGNORE INTO duplicate (cid) VALUES (?);",
[(row[1],) for row in rows])
process_pkgdict(cur, pkgdict)
+ cur.execute("INSERT INTO issue (cid, issue) SELECT content.id, 'file named something.gz is not a valid gzip file' FROM content WHERE content.filename LIKE '%.gz' AND NOT EXISTS (SELECT 1 FROM hash WHERE hash.cid = content.id AND hash.function = 'gzip_sha512');")
+ cur.execute("INSERT INTO issue (cid, issue) SELECT content.id, 'png image not named something.png' FROM content JOIN hash ON content.id = hash.cid WHERE function = 'image_sha512' AND lower(filename) NOT LIKE '%.png';")
db.commit()
if __name__ == "__main__":