1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
|
#!/usr/bin/env python
import os, sys
from datetime import datetime
from fnmatch import fnmatch
from pkgcore.config import load_config
from pkgcore.cache import metadata
from pkgcore.ebuild import repository
from sqlalchemy import create_engine
from sqlalchemy.orm import scoped_session, sessionmaker
from sqlalchemy.orm.exc import NoResultFound
path = os.path.join(os.path.dirname(__file__), os.path.pardir)
sys.path.insert(0, path)
from grumpy.models import Base, Category, Developer, Ebuild, Herd, Package
def main(path):
engine = create_engine('postgresql://grumpy:grumpy@localhost/grumpy')
session = scoped_session(sessionmaker(autocommit=False,
autoflush=False,
bind=engine))
Base.query = session.query_property()
# pkgcore part to fetch all the ebuild information
conf = load_config()
eclass_cache = conf.eclass_cache['eclass stack']
cache = metadata.database(readonly=True, location=path)
repo = repository.UnconfiguredTree(path, cache=cache, \
eclass_cache=eclass_cache)
def extract_version(pkg, cpv):
"""..."""
return cpv[len(pkg)+1:-7]
def package_update(cat, pkg, files, mtime):
"""Update package information in database."""
# Fetch package from database
package = Package.query.filter_by(cat=cat).filter_by(pkg=pkg).first()
# Check whether package in database is up-to-date
if package and package.mtime == datetime.fromtimestamp(mtime):
assert len(package.ebuilds) == len(files)
return
print "DEBUG: updating package %s/%s" % (cat, pkg)
# No ebuilds for package?
if len(files) == 0:
# TODO, need to check whether there's been pkgmove
raise NotImplementedError
pack = repo[(cat, pkg, extract_version(pkg, files[0]))]
# Update or create new package
if not package:
package = Package(pack.category, pack.package, pack.description, \
pack.longdescription, pack.homepage, mtime)
session.add(package)
else:
# Update package fields
package.cat = pack.category
package.pkg = pack.package
package.desc = pack.description
package.ldesc = pack.longdescription
package.homepage = pack.homepage
package.mtime = datetime.fromtimestamp(mtime)
# Add/Update devs and herds
new = [d.email for d in pack.maintainers]
old = [d.email for d in package.devs]
# Remove links to removed developers
for dev in [item for item in old if item not in new]:
print "DEBUG: removing developer reference:", dev
package.devs.remove(Developer.query.filter_by(email=dev).one())
# Add/update new developers
for dev in new:
if dev in old:
continue
print "DEBUG: adding developer reference:", dev
d = Developer.query.filter_by(email=dev).first()
if not d:
print "DEBUG: adding new developer to database:", dev
d = Developer(dev)
package.devs.append(d)
# Handle herds
new = []
for herd in pack.herds:
if herd is None:
herd = 'fix-me'
new.append(herd.strip())
old = [h.name for h in package.herds]
for herd in [item for item in old if item not in new]:
print "DEBUG: removing herd reference", herd
package.herds.remove(Herd.query.filter_by(name=herd).one())
for herd in new:
if herd in old:
continue
print "DEBUG: adding herd reference:", herd
h = Herd.query.filter_by(name=herd).first()
if not h:
print "DEBUG: adding new herd to database:", herd
h = Herd(herd)
package.herds.append(h)
# Handle ebuilds
new = [extract_version(pkg, file) for file in files]
old = [e.version for e in package.ebuilds]
print "DEBUG: old: ", old
print "DEBUG: new: ", new
print "DEBUG: diff", [item for item in new if item not in old]
for ver in [item for item in old if item not in new]:
# Delete old ebuilds
ebuild = Ebuild.query.filter_by(cpv="%s/%s-%s" % (pkg, cat, ver)).first()
if not ebuild:
print "Corruption detected: ebuild not found in database"
raise RuntimeError
session.delete(ebuild)
# Updates/add new ebuilds
for ver in new:
ebuild = repo[(cat, pkg, ver)]
if ver not in old:
iuse = list()
fiuse = list()
for u in ebuild.iuse:
if u[0] == '+':
iuse.append(u[1:])
fiuse.append(u[1:])
else:
iuse.append(u)
package.ebuilds.append(Ebuild(package, ebuild.fullver, \
ebuild.eapi, ebuild.slot, \
ebuild.keywords, iuse, fiuse))
continue
# FIXME: use package.ebuilds for lookup
oeb = Ebuild.query.filter_by(cpv="%s/%s-%s" % (pkg, cat, ver)).first()
if not oeb:
print "Ebuild must be in database, corruption detected"
raise RuntimeError
iuse = list()
fiuse = list()
for u in ebuild.iuse:
if u[0] == '+':
iuse.append(u[1:])
fiuse.append(u[1:])
else:
iuse.append(u)
oeb.iuse = iuse
oeb.fiuse = fiuse
oeb.eapi = ebuild.eapi
oeb.slot = ebuild.slot
oeb.keywords = list(ebuild.keywords)
session.commit()
# Compare list of categories in portage vs database
cat_sql = [c.cat for c in Category.query.all()]
cats = repo.categories.keys()
# Store for later
cat_diff = list(set(cat_sql) | set(cats))
# TODO
# save/del categories from database
# Traverse portage
for cat in cats:
catdir = os.path.join(path, cat)
pkgs = os.listdir(catdir)
# TODO
# handle package moves (when one isn't in tree and when one is..)
for pkg in pkgs:
dir = os.path.join(catdir, pkg)
if not os.path.isdir(dir):
continue
files = [f for f in os.listdir(dir) if fnmatch(f, '*.ebuild')]
package_update(cat, pkg, files, int(os.stat(dir).st_mtime))
if __name__ == '__main__':
if len(sys.argv) != 2:
print "Please provide path to portage directory as argument"
sys.exit()
main(sys.argv[1])
|