~ubuntu-branches/ubuntu/maverick/python-debian/maverick

Viewing changes to debian_bundle/debtags.py

Committer: Bazaar Package Importer
Author(s): John Wright
Date: 2008-04-30 23:58:24 UTC
mfrom: (1.1.9 hardy)
Revision ID: james.westby@ubuntu.com-20080430235824-iq9mp0fbd0efmruv

Tags: 0.1.10

http://bugs.debian.org/473254

http://bugs.debian.org/473259

* debian_bundle/deb822.py, tests/test_deb822.py:
  - Do not cache _CaseInsensitiveString objects, since it causes case
    preservation issues under certain circumstances (Closes: #473254)
  - Add a test case
* debian_bundle/deb822.py:
  - Add support for fixed-length subfields in multivalued fields.  I updated
    the Release and PdiffIndex classes to use this.  The default behavior for
    Release is that of apt-ftparchive, just because it's simpler.  Changing
    the behavior to resemble dak requires simply setting the
    size_field_behavior attribute to 'dak'.  (Ideally, deb822 would detect
    which behavior to use if given an actual Release file as input, but this
    is not implemented yet.)  (Closes: #473259)
  - Add support for Checksums-{Sha1,Sha256} multivalued fields in Dsc and
    Changes classes
* debian/control:
  - "python" --> "Python" in the Description field
  - Change the section to "python"

files added:
HISTORY.deb822

TODO

deb822.py

debian/NEWS

debian/pyversions

debian_bundle/arfile.py

debian_bundle/debfile.py

examples/changelog/changelog_to_file

examples/deb822

examples/deb822/grep-maintainer

examples/deb822/grep_native_packages.py

examples/debfile

examples/debfile/ar

examples/debfile/changelog_head

examples/debfile/dpkg-info

examples/debfile/extract_cron

examples/debtags/pkgwalk

examples/debtags/tagminer

setup.py.in

tests

tests/test-broken.deb.uu

tests/test.deb.uu

tests/test_changelog

tests/test_deb822.py

tests/test_debfile.py

tests/test_debtags.py

tests/test_modify_changelog1

tests/test_modify_changelog2

tests/test_modify_changelog3

tests/test_strange_changelog

tests/test_tagdb

files removed:
debian_bundle/test_changelog

debian_bundle/test_deb822.py

debian_bundle/test_debtags.py

debian_bundle/test_modify_changelog1

debian_bundle/test_modify_changelog2

debian_bundle/test_modify_changelog3

debian_bundle/test_tagdb

setup.py

files modified:
README

README.changelog

README.deb822

debian/changelog

debian/control

debian/copyright

debian/docs

debian/rules

debian_bundle/changelog.py

debian_bundle/deb822.py

debian_bundle/debian_support.py

debian_bundle/debtags.py

Show diffs side-by-side

added added

removed removed

debian_bundle/debtags.py

# debtags.py -- Access and manipulate Debtags information

# This library is free software; you can redistribute it and/or

# modify it under the terms of the GNU Lesser General Public

# License as published by the Free Software Foundation; either

# version 2.1 of the License, or (at your option) any later version.

# This library is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# This program is free software: you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation, either version 3 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful, but

# WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU

# Lesser General Public License for more details.

# You should have received a copy of the GNU Lesser General Public

# License along with this library; if not, write to the Free Software

# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA

# General Public License for more details.

# TODO: install python-epydoc and try to autogenerate documentation from that

import math

# You should have received a copy of the GNU General Public License

# along with this program. If not, see <http://www.gnu.org/licenses/>.

import math, re, cPickle

def parseTags(input):
    """
    Parse tag database lines, yielding one (pkgs, tags) pair per line.

    input is any iterable of text lines.  Each line is expected to look
    like "pkg1, pkg2: tag1, tag2"; the tag part (and the colon) may be
    missing, in which case an empty tag set is yielded.

    Yields tuples (pkgs, tags) where both elements are sets of strings.
    Lines the pattern cannot match (such as empty lines) are skipped
    instead of aborting the whole parse.
    """
    # Group 1 is the comma-separated package list; group 2, when present,
    # is the comma-separated tag list after the colon.  The trailing \s*
    # absorbs the end-of-line character, so lines need no prior stripping.
    lre = re.compile(r"^(.+?)(?::?\s*|:\s+(.+?)\s*)$")
    for line in input:
        m = lre.match(line)
        if m is None:
            # Nothing before the line end to use as a package name.
            continue
        pkgs = set(m.group(1).split(', '))
        if m.group(2):
            tags = set(m.group(2).split(', '))
        else:
            tags = set()
        yield pkgs, tags

def readTagDatabase(input):

"Read the tag database, returning a pkg->tags dictionary"

db = {}

for line in input:

# Is there a way to remove the last character of a line that does not

# make a copy of the entire line?

line = line.rstrip("\n")

pkgs, tags = line.split(": ")

for pkgs, tags in parseTags(input):

# Create the tag set using the native set

tags = set(tags.split(", "))

for p in pkgs.split(", "):

for p in pkgs:

db[p] = tags.copy()

return db;

def readTagDatabaseReversed(input):

"Read the tag database, returning a tag->pkgs dictionary"

db = {}

for line in input:

# Is there a way to remove the last character of a line that does not

# make a copy of the entire line?

line = line.rstrip("\n")

pkgs, tags = line.split(": ")

for pkgs, tags in parseTags(input):

# Create the tag set using the native set

pkgs = set(pkgs.split(", "))

for tag in tags.split(", "):

for tag in tags:

if db.has_key(tag):

db[tag] |= pkgs

else:

"Read the tag database, returning a pkg->tags and a tag->pkgs dictionary"

db = {}

dbr = {}

for line in input:

# Is there a way to remove the last character of a line that does not

# make a copy of the entire line?

line = line.rstrip("\n")

pkgs, tags = line.split(": ")

for pkgs, tags in parseTags(input):

# Create the tag set using the native set

pkgs = set(pkgs.split(", "))

if tagFilter == None:

tags = set(tags.split(", "))

tags = set(tags)

else:

tags = set(filter(tagFilter, tags.split(', ')))

tags = set(filter(tagFilter, tags))

for pkg in pkgs:

db[pkg] = tags.copy()

for tag in tags:

149

142

"""

150

143

self.db, self.rdb = readTagDatabaseBothWays(input, tagFilter)

151

144

145

def qwrite(self, file):

146

"Quickly write the data to a pickled file"

147

cPickle.dump(self.db, file)

148

cPickle.dump(self.rdb, file)

149

150

def qread(self, file):

151

"Quickly read the data from a pickled file"

152

self.db = cPickle.load(file)

153

self.rdb = cPickle.load(file)

154

152

155

def insert(self, pkg, tags):

153

156

self.db[pkg] = tags.copy()

154

157

for tag in tags:

170

173

res.rdb = self.db

171

174

return res

172

175

176

def facetCollection(self):

177

"""

178

Return a copy of this collection, but replaces the tag names

179

with only their facets.

180

"""

181

fcoll = DB()

182

tofacet = re.compile(r"^([^:]+).+")

183

for pkg, tags in self.iterPackagesTags():

184

ftags = set([tofacet.sub(r"\1", t) for t in tags])

185

fcoll.insert(pkg, ftags)

186

return fcoll

187

188

def copy(self):

189

"""

190

Return a copy of this collection, with the tagsets copied as

191

well.

192

"""

193

res = DB()

194

res.db = self.db.copy()

195

res.rdb = self.rdb.copy()

196

return res

197

173

198

def reverseCopy(self):

174

199

"""

175

200

Return the reverse collection, with a copy of the tagsets of

176

this one

201

this one.

177

202

"""

178

203

res = DB()

179

204

res.db = self.rdb.copy()

209

234

def filterPackages(self, packageFilter):

210

235

"""

211

236

Return a collection with only those packages that match a

212

filter, sharing tagsets with this one

237

filter, sharing tagsets with this one. The filter will match

238

on the package.

213

239

"""

214

240

res = DB()

215

241

db = {}

222

248

def filterPackagesCopy(self, filter):

223

249

"""

224

250

Return a collection with only those packages that match a

225

filter, with a copy of the tagsets of this one

251

filter, with a copy of the tagsets of this one. The filter

252

will match on the package.

226

253

"""

227

254

res = DB()

228

255

db = {}

232

259

res.rdb = reverse(db)

233

260

return res

234

261

262

def filterPackagesTags(self, packageTagFilter):

263

"""

264

Return a collection with only those packages that match a

265

filter, sharing tagsets with this one. The filter will match

266

on (package, tags).

267

"""

268

res = DB()

269

db = {}

270

for pkg, tags in filter(packageTagFilter, self.db.iteritems()):

271

db[pkg] = self.db[pkg]

272

res.db = db

273

res.rdb = reverse(db)

274

return res

275

276

def filterPackagesTagsCopy(self, packageTagFilter):

277

"""

278

Return a collection with only those packages that match a

279

filter, with a copy of the tagsets of this one. The filter

280

will match on (package, tags).

281

"""

282

res = DB()

283

db = {}

284

for pkg, tags in filter(packageTagFilter, self.db.iteritems()):

285

db[pkg] = self.db[pkg].copy()

286

res.db = db

287

res.rdb = reverse(db)

288

return res

289

290

def filterTags(self, tagFilter):

291

"""

292

Return a collection with only those tags that match a

293

filter, sharing package sets with this one. The filter will match

294

on the tag.

295

"""

296

res = DB()

297

rdb = {}

298

for tag in filter(tagFilter, self.rdb.iterkeys()):

299

rdb[tag] = self.rdb[tag]

300

res.rdb = rdb

301

res.db = reverse(rdb)

302

return res

303

304

def filterTagsCopy(self, tagFilter):

305

"""

306

Return a collection with only those tags that match a

307

filter, with a copy of the package sets of this one. The

308

filter will match on the tag.

309

"""

310

res = DB()

311

rdb = {}

312

for tag in filter(tagFilter, self.rdb.iterkeys()):

313

rdb[tag] = self.rdb[tag].copy()

314

res.rdb = rdb

315

res.db = reverse(rdb)

316

return res

317

235

318

def hasPackage(self, pkg):

236

319

"""Check if the collection contains the given package"""

237

320

return self.db.has_key(pkg)

346

429

return set(tags[:1])

347

430

else:

348

431

return tagset

432

433

def correlations(self):

434

"""

435

Generate the list of correlations as tuples (hastag, hasalsotag, score).

436

437

Every tuple will indicate that the tag 'hastag' tends to also

438

have 'hasalsotag' with a score of 'score'.

439

"""

440

for pivot in self.iterTags():

441

with_ = self.filterPackagesTags(lambda pt: pivot in pt[1])

442

without = self.filterPackagesTags(lambda pt: pivot not in pt[1])

443

for tag in with_.iterTags():

444

if tag == pivot: continue

445

has = float(with_.card(tag)) / float(with_.packageCount())

446

hasnt = float(without.card(tag)) / float(without.packageCount())

447

yield pivot, tag, has - hasnt

Older »