summaryrefslogtreecommitdiff
path: root/autoimport.py
blob: 453a839f983625d31c301c2be0dc1afa3ebfa034 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
#!/usr/bin/python

import gzip
import io
import sqlite3
import subprocess
import sys
import urllib

from debian import deb822
from debian.debian_support import version_compare

def main():
    urlbase = sys.argv[1]
    db = sqlite3.connect("test.sqlite3")
    cur = db.cursor()
    cur.execute("PRAGMA foreign_keys = ON;")
    cur.execute("SELECT package, version FROM package;")
    knownpkgs = dict((row[0], row[1]) for row in cur.fetchall())

    pkglist = urllib.urlopen(urlbase + "/dists/sid/main/binary-amd64/Packages.gz").read()
    pkglist = gzip.GzipFile(fileobj=io.BytesIO(pkglist)).read()
    distpkgs = set()
    for pkg in deb822.Packages.iter_paragraphs(io.BytesIO(pkglist)):
        name = pkg["Package"]
        distpkgs.add(name)
        if name in knownpkgs and \
                version_compare(pkg["Version"], knownpkgs[name]) <= 0:
            continue
        pkgurl = "%s/%s" % (urlbase, pkg["Filename"])
        print("importing %s" % name)
        dl = subprocess.Popen(["curl", "-s", pkgurl], stdout=subprocess.PIPE)
        imp = subprocess.Popen("./importpkg.py", stdin=dl.stdout)
        if imp.wait():
            print("import failed")
        if dl.wait():
            print("curl failed")
    
    delpkgs = set(knownpkgs) - distpkgs
    print("clearing packages %s" % " ".join(delpkgs))
    cur.executemany("DELETE FROM package WHERE package = ?;",
                    ((pkg,) for pkg in delpkgs))
    # Tables content, dependency and sharing will also be pruned
    # due to ON DELETE CASCADE clauses.
    db.commit()

if __name__ == "__main__":
    main()