File: tagsbyrelevance

package info (click to toggle)
python-debian 0.1.18%2Bsqueeze1
  • links: PTS, VCS
  • area: main
  • in suites: squeeze
  • size: 616 kB
  • ctags: 642
  • sloc: python: 4,141; makefile: 49
file content (52 lines) | stat: -rw-r--r-- 1,771 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
#!/usr/bin/python

# debtags - Implement package tags support for Debian
#
# Copyright (C) 2003--2006  Enrico Zini <enrico@debian.org>
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

import sys
import re
from debian import debtags

if len(sys.argv) < 2:
	print sys.stderr, "Usage: %s tagdb [packagelist]" % (sys.argv[0])
	sys.exit(1)

full = debtags.DB()
# Read full database
tag_filter = re.compile(r"^special::.+$|^.+::TODO$")
full.read(open(sys.argv[1], "r"), lambda x: not tag_filter.match(x))

# Read the package list and create the subcollection
input = len(sys.argv) > 2 and open(sys.argv[2],"r") or sys.stdin
pkgs = set()
for pkg in input:
	# Tolerate apt-cache search output as well
	pkg, none = pkg.rstrip("\n").split(' - ', 1)
	pkgs.add(pkg)

sub = full.choose_packages(pkgs)

rel_index = debtags.relevance_index_function(full, sub)

# Get all the tags sorted by increasing relevance
tags = sorted(sub.iter_tags(), lambda a, b: cmp(rel_index(a), rel_index(b)))

## And finally print them
for tag in tags:
	print tag
	#print tag, sub.card(tag), full.card(tag), float(sub.card(tag)) / float(full.card(tag))