~ubuntu-branches/ubuntu/utopic/bauble/utopic

Viewing changes to scripts/chklist2csv.py

Committer: Bazaar Package Importer
Author(s): Alessio Treglia
Date: 2009-07-27 10:40:53 UTC
mfrom: (3.1.1 sid)
Revision ID: james.westby@ubuntu.com-20090727104053-n5ieslixn3my8fa3

Tags: 0.9.2-1ubuntu1

* Merge from debian unstable, Ubuntu remaining changes:
- Take python stuffs from /usr/local to install them into /usr, otherwise
it FTBFS.

files added:
PKG-INFO

bauble.egg-info

bauble.egg-info/PKG-INFO

bauble.egg-info/SOURCES.txt

bauble.egg-info/dependency_links.txt

bauble.egg-info/requires.txt

bauble.egg-info/top_level.txt

po/da.po

po/en_CA.po

po/eo.po

po/fr.po

po/gl.po

po/hu.po

po/it.po

po/nl.po

po/pt.po

po/ro.po

po/ru.po

po/sq.po

po/sv.po

files removed:
.emacs-prj

.pylintrc

IDEAS

bauble.sh

bauble/connmgr.glade.h

bauble/plugins/abcd/abcd_2.06.xsd

bauble/plugins/garden/acc_infobox.glade.h

bauble/plugins/garden/infoboxes.glade.h

bauble/plugins/garden/plant_infobox.glade.h

bauble/plugins/plants/editors.glade.h

bauble/plugins/plants/infoboxes.glade.h

bauble/plugins/report/default/gui.glade.h

bauble/plugins/report/report.glade.h

bauble/plugins/report/template/test.html

bauble/plugins/tag/tag.glade.h

bauble/utils/bze_checklist

doc/.static

doc/.templates

doc/Makefile

doc/api.rst

doc/conf.py

doc/editing.rst

doc/extending.rst

doc/imex.rst

doc/index.rst

doc/installing.rst

doc/intro.rst

doc/report.rst

doc/searching.rst

doc/started.rst

doc/tagging.rst

messages.pot

po/README

scripts/bauble-upgrade-0.3-to-0.4.py

scripts/bauble-upgrade-0.4-to-0.5.py

scripts/bauble-upgrade-0.5-to-0.6.py

scripts/bauble-upgrade-0.6-to-0.7.py

scripts/bauble-upgrade-0.8-to-0.9.py

scripts/bgci_csv.py

scripts/build.nsi

scripts/bump_version.py

scripts/chklist2csv.py

scripts/createdb.py

scripts/fix_geotdwg.py

scripts/gen_model_doc.py

scripts/gen_search_doc.py

scripts/i18n.sh

scripts/install_deps.py

scripts/install_gtk.py

scripts/kew2csv.py

scripts/make_ico.py

scripts/manage-gtk.py

scripts/tdgwgeo2csv.py

scripts/wgs2csv.py

test/itest.py

test/test.sh

web/images

web/images/bauble_logo.gif

web/images/bauble_logo.png

web/images/bauble_logo.svg

web/images/bauble_logo2.png

web/images/bauble_logo_old.gif

web/images/bauble_ss1_large.png

web/images/bauble_ss1_small.png

web/images/gem.svg

web/images/screenshots

web/images/screenshots/0.6

web/images/screenshots/0.6/bauble-acc-editor-coll-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-acc-editor-coll-0.6.0.png

web/images/screenshots/0.6/bauble-acc-editor-don-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-acc-editor-don-0.6.0.png

web/images/screenshots/0.6/bauble-default-formatter-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-default-formatter-0.6.0.png

web/images/screenshots/0.6/bauble-donor-editor-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-donor-editor-0.6.0.png

web/images/screenshots/0.6/bauble-family-editor-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-family-editor-0.6.0.png

web/images/screenshots/0.6/bauble-genus-editor-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-genus-editor-0.6.0.png

web/images/screenshots/0.6/bauble-location-editor-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-location-editor-0.6.0.png

web/images/screenshots/0.6/bauble-main-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-main-0.6.0.png

web/images/screenshots/0.6/bauble-pg-conn-dialog-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-pg-conn-dialog-0.6.0.png

web/images/screenshots/0.6/bauble-plant-editor-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-plant-editor-0.6.0.png

web/images/screenshots/0.6/bauble-species-editor-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-species-editor-0.6.0.png

web/images/screenshots/0.6/bauble-sqlite-conn-dialog-0.6.0-thumb.png

web/images/screenshots/0.6/bauble-sqlite-conn-dialog-0.6.0.png

web/images/screenshots/0.7

web/images/screenshots/0.7/bauble-acc-editor-coll-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-acc-editor-coll-0.7.0.png

web/images/screenshots/0.7/bauble-acc-editor-don-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-acc-editor-don-0.7.0.png

web/images/screenshots/0.7/bauble-closed-conn-dialog-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-closed-conn-dialog-0.7.0.png

web/images/screenshots/0.7/bauble-connect-warning-0.7-thumb.png

web/images/screenshots/0.7/bauble-connect-warning-0.7.png

web/images/screenshots/0.7/bauble-create-new-0.7-thumb.png

web/images/screenshots/0.7/bauble-create-new-0.7.png

web/images/screenshots/0.7/bauble-family-editor-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-family-editor-0.7.0.png

web/images/screenshots/0.7/bauble-genus-editor-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-genus-editor-0.7.0.png

web/images/screenshots/0.7/bauble-location-editor-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-location-editor-0.7.0.png

web/images/screenshots/0.7/bauble-main-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-main-0.7.0.png

web/images/screenshots/0.7/bauble-pg-conn-dialog-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-pg-conn-dialog-0.7.0.png

web/images/screenshots/0.7/bauble-plant-editor-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-plant-editor-0.7.0.png

web/images/screenshots/0.7/bauble-species-editor-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-species-editor-0.7.0.png

web/images/screenshots/0.7/bauble-sqlite-conn-dialog-0.7.0-thumb.png

web/images/screenshots/0.7/bauble-sqlite-conn-dialog-0.7.0.png

web/images/screenshots/bauble-connect-warning-0.7-thumb.png

web/images/screenshots/bauble-connect-warning-0.7.png

web/images/screenshots/bauble-create-new-0.7-thumb.png

web/images/screenshots/bauble-create-new-0.7.png

web/index.html

web/install_linux.html

web/install_windows.html

web/news_template.html

web/screenshots.html

web/sitemap.xml

web/style.css

web/template.html

web/using.html

files modified:
bauble/__init__.py

bauble/_gui.py

bauble/connmgr.py

bauble/db.py

bauble/editor.py

bauble/i18n.py

bauble/meta.py

bauble/paths.py

bauble/pluginmgr.py

bauble/plugins/abcd/__init__.py

bauble/plugins/garden/__init__.py

bauble/plugins/garden/accession.py

bauble/plugins/garden/donor.py

bauble/plugins/garden/institution.py

bauble/plugins/garden/location.py

bauble/plugins/garden/plant.py

bauble/plugins/garden/source.py

bauble/plugins/garden/test.py

bauble/plugins/imex/__init__.py

bauble/plugins/imex/csv_.py

bauble/plugins/imex/test.py

bauble/plugins/imex/xml.py

bauble/plugins/picasa/__init__.py

bauble/plugins/picasa/test.py

bauble/plugins/plants/__init__.py

bauble/plugins/plants/family.py

bauble/plugins/plants/genus.py

bauble/plugins/plants/species.py

bauble/plugins/plants/species_editor.py

bauble/plugins/plants/species_model.py

bauble/plugins/plants/test.py

bauble/plugins/report/__init__.py

bauble/plugins/report/default/__init__.py

bauble/plugins/report/template/__init__.py

bauble/plugins/report/template/test.py

bauble/plugins/report/test.py

bauble/plugins/tag/__init__.py

bauble/prefs.py

bauble/task.py

bauble/test/__init__.py

bauble/test/test_bauble.py

bauble/test/test_meta.py

bauble/test/test_view.py

bauble/types.py

bauble/utils/__init__.py

bauble/utils/desktop.py

bauble/utils/log.py

bauble/utils/test.py

bauble/view.py

data/bauble.desktop

debian/bauble.docs

debian/changelog

debian/control

po/de.po

po/es.po

po/et.po

po/pl.po

po/pt_BR.po

po/sk.po

scripts/bauble

setup.cfg

setup.py

stdeb.cfg

Show diffs side-by-side

added added

removed removed

scripts/chklist2csv.py

#!/usr/bin/python

import sys, re, csv

# Root directory of the data files; every input path below is built from it.
data_dir = '/home/brett/devel/bauble/data/'

# Input files, all located under data_dir.
families_file = ''.join((data_dir, 'csv/Family.txt'))
genera_file = ''.join((data_dir, 'csv/Genera.txt'))
checklist_file = ''.join((data_dir, 'old/belize_plants.txt'))

# Quoted, comma-separated column names for the species CSV header line.
species_columns = ','.join(
    '"%s"' % column
    for column in (
        'genusID',
        'sp',
        'sp_author',
        'infrasp_rank',
        'infrasp',
        'infrasp_author',
        'sp_hybrid',
    )
)

# synonyms to use for the checklist genera

#generic_synonyms = {'Adenocalymna', Adenocalymma Mart. ex Meisn.

# a plant class with support for parsing a plant name string

# to contruct the object

class Plant:

def __init__(self, genus=None, species=None, infrasp_rank=None,

infrasp=None, cv=None):

self.genus = genus or ""

self.species = species or ""

self.species_author = ""

self.infrasp_rank = infrasp_rank or ""

self.infrasp_author = ""

self.infrasp = infrasp or ""

# self.cv = cv or ""

# self.is_cv = '' # HACK for this file only

self.hybrid = ''

def match(self, species):

partsList = re.split("(?:subsp\.)+|(?:var\.)+", species)

speciesPart = partsList[0].strip()

# ** match species part

# look for .sp, meaning it is not identified and should only

# set the genus

if speciesPart.find(" sp.") != -1:

self.genus = re.match("(?P<genus>[\w]*)\s+",

speciesPart).group("genus");

return

m = re.match(

"""(?P<genus>[\w]*)\s+ # match the genus

(?P<hybrid>x?)\s? # hybrid sign

(?P<species>[\w-]*)\s? # match the species

(?P<author>.*)""",

speciesPart, re.VERBOSE)

self.genus = m.group("genus")

self.species = m.group("species")

self.hybrid = m.group("hybrid")

self.species_author = m.group("author")

# check for infrasp_rank

if species.find("subsp.") != -1:

self.infrasp_rank = "subsp."

elif species.find("var.") != -1:

self.infrasp_rank = "var."

if self.infrasp_rank is not "":

infraspPart = partsList[1].strip();

m = re.match(

"""\A(?P<infrasp>[\w]*)\s?

(?P<infrasp_author>.*)""", infraspPart, re.VERBOSE)

self.infrasp = m.group("infrasp")

self.infrasp_author = m.group("infrasp_author")

# return a dict with key, value pairs for each member that has a value

# don't return key/values if the string is ""

#http://vsbabu.org/mt/archives/2003/02/13/joy_of_python_classes_and_dictionaries.html

#return dict([(k, v) for (k, v) in o.__dict__.items if not k.startswith('_'+o.__class__.__name__)])

# TODO: i'm not sure if this works

def dict(self):

"""Return a dictionary from object that has public

variable -> key pairs

"""

dict = {}

#Joy: all the attributes in a class are already in __dict__

privatePrefix = "_" + self.__class__.__name__

for elem in self.__dict__.keys():

if elem.find(privatePrefix) == 0:

continue

#We discard private variables, which are automatically

#named _ClassName__variablename, when we define it in

#the class as __variablename

elif self.__dict__[elem] != "":

try:

#dict[elem] = self.__dict__[elem].encode("latin-1")

dict[elem] = self.__dict__[elem]

except:

print dict[elem]

#dict[elem] = str(self.__dict__[elem]).encode("latin-1")

return dict

def __str__(self):

s = self.genus

if self.hybrid:

s += " " + "x"

100

if self.species is not None:

101

s += " " + self.species

102

else: s += " sp."

103

if self.infrasp_rank is not None:

104

s += " " + self.infrasp_rank + " " + self.infrasp

105

# if self.cv is not None:

106

# s += " " + self.cv

107

108

return s.strip()

109

110

# should be able to set field separator, field encloser, and some fields

111

# should be options like family, authors, hyrbid, etc..

112

def csv(self, with_family=False):

113

"""

114

print out in comma separated values format with the following fields:

115

genus, species, species_author, infrasp_rank, infrasp, infrasp_author, cv, hybrid

116

"""

117

csv = ""

118

ft = "," # field terminated

119

enclosed = '"' # field enclosed

120

field = lambda x: '%s%s%s' % (enclosed, x, enclosed)

121

if with_family is True:

122

csvStr += field(self.family) + ft

123

if isinstance(self.genus, int):

124

csv += str(self.genus) + ft

125

else: csv+= field(self.genus) + ft

126

127

try:

128

csv += field(self.species) + ft + \

129

field(self.species_author) + ft + \

130

field(self.infrasp_rank) + ft + \

131

field(self.infrasp) + ft + field(self.infrasp_author)

132

except UnicodeDecodeError, e:

133

print sys.stderr.write(e)

134

raise

135

136

# there are no cultivars in the belize checklist

137

# if self.cv is not "":

138

# csv += ft + field(" cv. " + self.cv)

139

# else:

140

# csv += ft+ field('') + ft

141

csv += ft + field(self.hybrid)

142

#if self.hybrid is not '':

143

# csv += ft + 'True'

144

#else:

145

# csv += ft

146

return csv

147

# end Plant class

148

149

150

###################################################

151

152

153

# First parse the genera file into a genus name -> genus id map.
# presumably column 0 holds the id and column 2 the name -- TODO confirm
# against the layout of Genera.txt.
# TODO: there is one genus in the file that has a duplicate name, find it
# and make sure that we don't use it in the checklist
gen_dict = {}
missing = {}    # genus name -> list of checklist names using that genus
bad_lines = []  # checklist lines that could not be converted

with open(genera_file) as genera:
    for row in csv.reader(genera):
        gen_dict[row[2]] = row[0]

# print out a first line since it will be skipped
print(species_columns)

family = None
with open(checklist_file) as checklist:
    for line in checklist:
        line = line.strip()
        if line == "":
            continue
        cultivated = "n"  # recorded per line but not used below
        # A line with no space, or one containing ":", is taken as a family
        # heading rather than a plant name.
        if line.find(" ") == -1 or line.find(":") != -1:
            family = line
            continue
        elif line.startswith('*'):
            # a leading "*" marks cultivated material
            cultivated = "y"
            line = line[1:]

        p = Plant()
        try:
            p.match(line)
        except (AttributeError, ValueError):
            # The name could not be parsed at all; report it at the end
            # instead of aborting the whole conversion.
            bad_lines.append(line)
            continue

        if p.genus not in gen_dict:
            missing.setdefault(p.genus, []).append(str(p))
        elif p.species == "":
            bad_lines.append(line)  # skip Prescottia sp. style names
        else:
            # NOTE(review): the original indentation was lost; a row is
            # emitted only once the genus has been resolved to its id,
            # since the first output column is "genusID".
            p.genus = int(gen_dict[p.genus])
            print(p.csv())

if len(missing) > 0:
    sys.stderr.write("******* could not find the following genera *******\n")
    for gen, sp in missing.items():
        sys.stderr.write('%s: %s\n' % (gen, sp))

if len(bad_lines) > 0:
    sys.stderr.write('******* could not do anything with the following lines: *******\n')
    for b in bad_lines:
        sys.stderr.write(b + '\n')

203

204

205

Older »