~ubuntu-branches/ubuntu/natty/pytables/natty-updates

Committer: Bazaar Package Importer
Author(s): Alexandre Fayolle
Date: 2006-06-28 10:45:03 UTC
mfrom: (1.2.1 upstream)
mto: This revision was merged to the branch mainline in revision 5.
Revision ID: james.westby@ubuntu.com-20060628104503-cc251q5o5j3e2k10

  * Fixed call to pyversions in debian/rules which failed on recent versions
    of pyversions
  * Fixed clean rule in debian/rules which left the stamp files behind
  * Acknowledge NMU
  * Added Alexandre Fayolle to uploaders

files added:
ANNOUNCE.txt.in

LICENSE.txt

LICENSES

LICENSES/HDF5.txt

LICENSES/LRUCACHE.txt

Makefile

RELEASE-NOTES.txt.in

VERSION

bench/LRU-experiments.py

bench/LRU-experiments2.py

bench/NetCDF-bench.py

bench/create-large-number-objects.py

bench/indexed_search.py

bench/open_close-bench-gzip.h5

bench/open_close-bench.py

bench/open_close-bench2.py

bench/plot-bar.py

bench/postgres-search-bench.py

bench/postgres_backend.py

bench/pytables-search-bench.py

bench/pytables_backend.py

bench/search-bench-plot.py

bench/sqlite3-search-bench.py

bench/undo_redo.py

bench/undo_redo.txt

contrib/h5_dap_plugin.py

debian/control.meu

debian/pycompat

debian/rules.meu

doc/Makefile

doc/html/a6585.html

doc/html/a6736.html

doc/html/a6829.html

doc/html/a6969.html

doc/html/c1381.html

doc/html/c227.html

doc/html/c38.html

doc/html/c514.html

doc/html/c5270.html

doc/html/c5708.html

doc/html/c6061.html

doc/html/compressed-recordsize-shuffle.png

doc/html/compressed-recordsize-zlib.png

doc/html/compressed-recordsize.png

doc/html/compressed-select-cache-shuffle-only.png

doc/html/compressed-select-cache-shuffle.png

doc/html/compressed-select-cache-zlib.png

doc/html/compressed-select-cache.png

doc/html/compressed-select-nocache-shuffle-only.png

doc/html/compressed-select-nocache-shuffle.png

doc/html/compressed-select-nocache.png

doc/html/compressed-writing-shuffle-only.png

doc/html/compressed-writing-shuffle.png

doc/html/compressed-writing-zlib.png

doc/html/compressed-writing.png

doc/html/index.html

doc/html/indexTimes-itanium.png

doc/html/logo3-ombra.png

doc/html/objecttree-h5.png

doc/html/objecttree.png

doc/html/p35.html

doc/html/p5706.html

doc/html/p6583.html

doc/html/read-medium-psyco-nopsyco-comparison.png

doc/html/rootUEP1.png

doc/html/rootUEP2.png

doc/html/searchTimes-float-itanium.png

doc/html/searchTimes-int-itanium.png

doc/html/searchTimes.png

doc/html/tutorial1-1-tableview.png

doc/html/tutorial1-2-tableview.png

doc/html/tutorial1-general.png

doc/html/tutorial2-tableview.png

doc/html/write-medium-psyco-nopsyco-comparison.png

doc/html/x1017.html

doc/html/x1085.html

doc/html/x1185.html

doc/html/x1268.html

doc/html/x1376.html

doc/html/x142.html

doc/html/x1533.html

doc/html/x2341.html

doc/html/x2546.html

doc/html/x2806.html

doc/html/x2981.html

doc/html/x3528.html

doc/html/x3623.html

doc/html/x3737.html

doc/html/x3869.html

doc/html/x4041.html

doc/html/x4072.html

doc/html/x4133.html

doc/html/x4290.html

doc/html/x4306.html

doc/html/x4389.html

doc/html/x457.html

doc/html/x4983.html

doc/html/x5297.html

doc/html/x5412.html

doc/html/x5502.html

doc/html/x5552.html

doc/html/x5576.html

doc/html/x5654.html

doc/html/x5689.html

doc/html/x5744.html

doc/html/x5755.html

doc/html/x5875.html

doc/html/x5885.html

doc/html/x5902.html

doc/html/x6072.html

doc/html/x6243.html

doc/html/x6437.html

doc/html/x6471.html

doc/html/x6480.html

doc/html/x6497.html

doc/html/x6782.html

doc/html/x6812.html

doc/html/x6885.html

doc/html/x6938.html

doc/html/x7025.html

doc/html/x7045.html

doc/html/x762.html

doc/html/x921.html

doc/scripts/filenode.py

doc/scripts/pickletrouble.py

doc/text

doc/text/nestedrecords.txt

doc/xml/Makefile

doc/xml/compressed-recordsize-shuffle.pdf

doc/xml/compressed-recordsize-zlib.pdf

doc/xml/compressed-recordsize.pdf

doc/xml/compressed-select-cache-shuffle-only.pdf

doc/xml/compressed-select-cache-shuffle.pdf

doc/xml/compressed-select-cache-zlib.pdf

doc/xml/compressed-select-cache.pdf

doc/xml/compressed-select-nocache-shuffle-only.pdf

doc/xml/compressed-select-nocache-shuffle.pdf

doc/xml/compressed-select-nocache.pdf

doc/xml/compressed-writing-shuffle-only.pdf

doc/xml/compressed-writing-shuffle.pdf

doc/xml/compressed-writing-zlib.pdf

doc/xml/compressed-writing.pdf

doc/xml/indexTimes-itanium.pdf

doc/xml/logo3-ombra.png

doc/xml/objecttree-h5.png

doc/xml/objecttree.dia

doc/xml/read-medium-psyco-nopsyco-comparison.pdf

doc/xml/rootUEP1.fig

doc/xml/rootUEP2.fig

doc/xml/searchTimes-float-itanium.pdf

doc/xml/searchTimes-int-itanium.pdf

doc/xml/searchTimes.pdf

doc/xml/strip-dbmanual.py

doc/xml/tutorial1-1-tableview.png

doc/xml/tutorial1-2-tableview.png

doc/xml/tutorial1-general.png

doc/xml/tutorial2-tableview.png

doc/xml/write-medium-psyco-nopsyco-comparison.pdf

examples/add-column.py

examples/carray1.py

examples/enum.py

examples/nested-iter.py

examples/nested-tut.py

examples/nested1.py

examples/netCDF_example.py

examples/tutorial3-1.py

examples/tutorial3-2.py

examples/undo-redo.py

src/H5ATTR.c

src/H5ATTR.h

src/H5Zbzip2.c

src/H5Zbzip2.h

src/Makefile

src/TableExtension.c

src/TableExtension.pyx

src/_comp_bzip2.c

src/_comp_bzip2.pyx

src/_comp_lzo.c

src/_comp_lzo.pyx

src/_comp_ucl.c

src/_comp_ucl.pyx

src/definitions.pxd

src/typeconv.c

src/typeconv.h

src/utilsExtension.c

src/utilsExtension.pyx

src/version.h.in

tables/Atom.py

tables/CArray.py

tables/NetCDF.py

tables/Node.py

tables/attributeaccess.py

tables/constants.py

tables/enum.py

tables/exceptions.py

tables/lrucache.py

tables/nestedrecords.py

tables/nriterators.py

tables/proxydict.py

tables/registry.py

tables/scripts

tables/scripts/__init__.py

tables/scripts/nctoh5.py

tables/scripts/ptdump.py

tables/scripts/ptrepack.py

tables/tests

tables/tests/Table1_0_ucl_nrv2e.h5

tables/tests/Table2_0_ucl_nrv2d.h5

tables/tests/Table2_1_lzo_nrv2e_shuffle.h5

tables/tests/Tables_lzo1.h5

tables/tests/Tables_lzo1_shuffle.h5

tables/tests/Tables_lzo2.h5

tables/tests/Tables_lzo2_shuffle.h5

tables/tests/__init__.py

tables/tests/check_leaks.py

tables/tests/common.py

tables/tests/ex-noattr.h5

tables/tests/flavored_vlarrays-pre1.6.h5

tables/tests/non-chunked-table.h5

tables/tests/smpl_SDSextendible.h5

tables/tests/smpl_compound_chunked.h5

tables/tests/smpl_enum.h5

tables/tests/smpl_f64be.h5

tables/tests/smpl_f64le.h5

tables/tests/smpl_i32be.h5

tables/tests/smpl_i32le.h5

tables/tests/smpl_i64be.h5

tables/tests/smpl_i64le.h5

tables/tests/smpl_unsupptype.h5

tables/tests/test_NetCDF.py

tables/tests/test_Numeric.py

tables/tests/test_all.py

tables/tests/test_array.py

tables/tests/test_attributes.py

tables/tests/test_backcompat.py

tables/tests/test_basics.py

tables/tests/test_carray.py

tables/tests/test_create.py

tables/tests/test_do_undo.py

tables/tests/test_earray.py

tables/tests/test_enum.py

tables/tests/test_filenode.dat

tables/tests/test_filenode.py

tables/tests/test_filenode.xbm

tables/tests/test_filenode_v1.h5

tables/tests/test_garbage.py

tables/tests/test_hdf5compat.py

tables/tests/test_indexes.py

tables/tests/test_indexvalues.py

tables/tests/test_lists.py

tables/tests/test_nestedrecords.py

tables/tests/test_nestedtypes.py

tables/tests/test_nriterators.py

tables/tests/test_numpy.py

tables/tests/test_tables.py

tables/tests/test_tablesMD.py

tables/tests/test_timetype.py

tables/tests/test_tree.py

tables/tests/test_types.py

tables/tests/test_vlarray.py

tables/tests/zerodim-attrs-1.3.h5

tables/tests/zerodim-attrs-1.4.h5

tables/undoredo.py

files removed:
LICENSE

doc/html/generahtml.sh

doc/html/html.css

doc/html/indexTimes-itanium-web.png

doc/html/makebib

doc/html/makeclean

doc/html/makeepss

doc/html/makeeqns

doc/html/makeidx

doc/html/makepage

doc/html/makepdfs

doc/html/makewebs

doc/html/objecttree-h5-web.jpg

doc/html/objecttree-h5.jpg

doc/html/objecttree-web.png

doc/html/paperbk4.jpg

doc/html/pretty.jpg

doc/html/read-medium-lzo-zlib-ucl-comparison-web.png

doc/html/read-medium-psyco-lzo-comparison-web.png

doc/html/read-medium-psyco-lzo-zlib-ucl-comparison-web.png

doc/html/read-medium-psyco-nopsyco-comparison-web.png

doc/html/rootUEP1-web.png

doc/html/rootUEP2-web.png

doc/html/searchTimes-float-itanium-web.png

doc/html/searchTimes-int-itanium-web.png

doc/html/tile.jpg

doc/html/tutorial1-general-web.jpg

doc/html/tutorial1-general.jpg

doc/html/tutorial1-tableview-web.jpg

doc/html/tutorial1-tableview.jpg

doc/html/tutorial2-tableview-web.jpg

doc/html/tutorial2-tableview.jpg

doc/html/usersguide.bib

doc/html/usersguide.html

doc/html/usersguide1.html

doc/html/usersguide2.html

doc/html/usersguide3.html

doc/html/usersguide4.html

doc/html/usersguide5.html

doc/html/usersguide6.html

doc/html/usersguide7.html

doc/html/usersguide8.html

doc/html/usersguide9.html

doc/html/write-medium-lzo-zlib-ucl-comparison-web.png

doc/html/write-medium-psyco-lzo-comparison-web.png

doc/html/write-medium-psyco-lzo-zlib-ucl-comparison-web.png

doc/html/write-medium-psyco-nopsyco-comparison-web.png

doc/objecttree.dia

doc/rootUEP1.fig

doc/rootUEP2.fig

doc/xml/indexTimes-itanium.eps

doc/xml/logo3-ombra.jpg

doc/xml/logo4-ombra.jpg

doc/xml/objecttree-h5.jpg

doc/xml/objecttree.eps

doc/xml/read-medium-lzo-zlib-ucl-comparison.eps

doc/xml/read-medium-psyco-lzo-zlib-ucl-comparison.eps

doc/xml/read-medium-psyco-nopsyco-comparison.eps

doc/xml/rootUEP1.eps

doc/xml/rootUEP2.eps

doc/xml/searchTimes-float-itanium.eps

doc/xml/searchTimes-int-itanium.eps

doc/xml/searchTimes.eps

doc/xml/tutorial1-general.jpg

doc/xml/tutorial1-tableview.jpg

doc/xml/tutorial2-tableview.jpg

doc/xml/write-medium-lzo-zlib-ucl-comparison.eps

doc/xml/write-medium-psyco-lzo-zlib-ucl-comparison.eps

doc/xml/write-medium-psyco-nopsyco-comparison.eps

src/H5LT.c

src/H5LT.h

src/H5TB.c

src/H5TB.h

src/calcoffset.c

src/calcoffset.h

src/getfieldfmt.c

src/getfieldfmt.h

src/type-longlong.h

test

test/Table1_0_ucl_nrv2e.h5

test/Table2_0_ucl_nrv2d.h5

test/Table2_1_ucl_nrv2e_shuffle.h5

test/ex-noattr.h5

test/test_Numeric.py

test/test_all.py

test/test_backcompat.py

test/test_basics.py

test/test_create.py

test/test_earray.py

test/test_filenode.dat

test/test_filenode.py

test/test_filenode.xbm

test/test_indexes.py

test/test_indexvalues.py

test/test_lists.py

test/test_numarray.py

test/test_tables.py

test/test_tablesMD.py

test/test_tree.py

test/test_types.py

test/test_vlarray.py

files modified:
ANNOUNCE.txt

MANIFEST.in

README.txt

RELEASE-NOTES.txt

THANKS

TODO.txt

bench/bsddb-table-bench.py

bench/cacheout.py

bench/copy-bench.py

bench/opteron-stress-test.txt

bench/recarray2-test.py

bench/search-bench.py

bench/searchsorted-bench.py

bench/searchsorted-bench2.py

bench/shelve-bench.py

bench/sqlite-search-bench.py

bench/stress-test.py

bench/stress-test2.py

bench/stress-test3.py

bench/table-bench.py

bench/table-bench2.py

bench/widetree.py

bench/widetree2.py

contrib/README

contrib/make_hdf.py

debian/README.Debian

debian/changelog

debian/control

debian/copyright

debian/nctoh5.1

debian/ptdump.1

debian/ptrepack.1

debian/rules

doc/usersguide.pdf

doc/xml/usersguide.bib

doc/xml/usersguide.xml

examples/array1.py

examples/check_examples.sh

examples/earray1.py

examples/filenodes1.py

examples/gl-test.py

examples/objecttree.py

examples/table-tree.py

examples/table1.py

examples/table3.py

examples/tutorial1-1.py

examples/tutorial1-2.py

examples/tutorial2.py

examples/vlarray1.py

examples/vlarray2.py

examples/vlarray3.py

setup.cfg

setup.py

src/H5ARRAY-opt.c

src/H5ARRAY-opt.h

src/H5ARRAY.c

src/H5ARRAY.h

src/H5TB-opt.c

src/H5TB-opt.h

src/H5VLARRAY.c

src/H5VLARRAY.h

src/H5Zlzo.c

src/H5Zlzo.h

src/H5Zucl.c

src/H5Zucl.h

src/arraytypes.c

src/hdf5Extension.c

src/hdf5Extension.pyx

src/tables.h

src/utils.c

src/utils.h

src/version.h

tables/Array.py

tables/AttributeSet.py

tables/EArray.py

tables/File.py

tables/Group.py

tables/Index.py

tables/IndexArray.py

tables/IsDescription.py

tables/Leaf.py

tables/Table.py

tables/UnImplemented.py

tables/VLArray.py

tables/__init__.py

tables/nodes/FileNode.py

tables/nodes/__init__.py

tables/utils.py

utils/nctoh5

utils/ptdump

utils/ptrepack

Show diffs side-by-side

added added

removed removed

tables/NetCDF.py

"""

PyTables NetCDF version 3 emulation API.

This module provides an API that is nearly identical to Scientific.IO.NetCDF

(http://starship.python.net/~hinsen/ScientificPython/ScientificPythonManual/Scientific.html).

Some key differences between the Scientific.IO.NetCDF API and the pytables

NetCDF emulation API to keep in mind are:

1) data is stored in an HDF5 file instead of a netCDF file.

2) Although each variable can have only one unlimited

dimension, it need not be the first as in a true NetCDF file.

Complex data types 'F' (Complex32) and 'D' (Complex64) are supported

in tables.NetCDF, but are not supported in netCDF

(or Scientific.IO.NetCDF). Files with variables that have

these datatypes, or an unlimited dimension other than the first,

cannot be converted to netCDF using h5tonc.

3) variables are compressed on disk by default using

HDF5 zlib compression with the 'shuffle' filter.

If the 'least_significant_digit' keyword is used when a

variable is created with the createVariable method, data will be

truncated (quantized) before being written to the file.

This can significantly improve compression. For example, if

least_significant_digit=1, data will be quantized using

numarray.around(scale*data)/scale, where scale = 2**bits, and

bits is determined so that a precision of 0.1 is retained (in

this case bits=4).

From http://www.cdc.noaa.gov/cdc/conventions/cdc_netcdf_standard.shtml:

"least_significant_digit -- power of ten of the smallest decimal

place in unpacked data that is a reliable value."

4) data must be appended to a variable with an unlimited

dimension using the 'append' method of the netCDF

variable object. In Scientific.IO.NetCDF, data can be added

along an unlimited dimension by assigning it to a slice (there

is no append method).

The 'sync' method synchronizes the size

of all variables with an unlimited dimension by filling in

data using the default netCDF _FillValue, and

is invoked automatically when the NetCDFFile object is closed.

In the Scientific.IO.NetCDF, the 'sync' method flushes the data to disk.

5) the createVariable method has three extra optional keyword

arguments not found in the Scientific.IO.NetCDF interface,

'least_significant_digit' (see item (3) above), 'expectedsize'

and 'filters'.

The 'expectedsize' keyword applies only to variables with an

unlimited dimension, and is an estimate of the number

of entries that will be added along that dimension

(default 1000). This estimate is used to optimize

HDF5 file access and memory usage.

The 'filters' keyword is a PyTables filters instance

that describes how to store the data on disk.

The default corresponds to complevel=6, complib='zlib',

shuffle=1 and fletcher32=0.

6) data can be saved to a real netCDF file using the NetCDFFile class

method 'h5tonc' (if Scientific.IO.NetCDF is installed). The

unlimited dimension must be the first (for all variables in the file)

in order to use the 'h5tonc' method.

Data can also be imported from a true netCDF file and saved

in an HDF5 file using the 'nctoh5' class method.

7) A list of attributes corresponding to global netCDF attributes

defined in the file can be obtained with the NetCDFFile ncattrs method.

Similarly, netCDF variable attributes can be obtained with

the NetCDFVariable ncattrs method.

8) you should not define global or variable attributes that start

with '_NetCDF_', those names are reserved for internal use.

9) output similar to 'ncdump -h' can be obtained by simply

printing the NetCDFFile instance.

A tables.NetCDF file consists of array objects (either EArrays or

CArrays) located in the root group of a pytables hdf5 file. Each of

the array objects must have a dimensions attribute, consisting of a

tuple of dimension names (the length of this tuple should be the same

as the rank of the array object). Any such objects with one

of the supported data types in a pytables file that conforms to

this simple structure can be read with the tables.NetCDF module.

Note: This module does not yet create HDF5 files that are compatible

with netCDF version 4.

Datasets created with the PyTables netCDF emulation API can be shared

over the internet with the OPeNDAP protocol (http://opendap.org), via

the python opendap module (http://opendap.oceanografia.org). A plugin

for the python opendap server is included with the pytables

distribution (contrib/h5_dap_plugin.py). Simply copy that file into

the 'plugins' directory of the opendap python module source

distribution, run 'setup.py install', point the opendap server to the

directory containing your hdf5 files, and away you go. Any OPeNDAP

aware client (such as Matlab or IDL) can now access your data over

http as if it were a local disk file.

Jeffrey Whitaker <jeffrey.s.whitaker@noaa.gov>

Version: 20051110

"""

__version__ = '20051110'

import math, tables, numarray

# Numeric is needed for h5 <--> netCDF conversion.  It is optional: record
# whether it could be imported instead of failing at import time.
Numeric_imported = True
try:
    import Numeric
except ImportError:
    # only a missing/unimportable module disables the feature; anything
    # else (e.g. KeyboardInterrupt) must not be silently swallowed.
    Numeric_imported = False
# Scientific is needed to convert to/from real netCDF files (also optional).
ScientificIONetCDF_imported = True
try:
    import Scientific.IO.NetCDF as RealNetCDF
except ImportError:
    ScientificIONetCDF_imported = False

109

110

# pytables type name -> single-character Numeric typecode.
_typecode_dict = {
    'Float64': 'd',
    'Float32': 'f',
    'Int32': 'i',
    'Int16': 's',
    'Int8': '1',
    'CharType': 'c',
    'Complex32': 'F',
    'Complex64': 'D',
}

# single-character Numeric typecode -> netCDF data type name
# (False if no corresponding netCDF datatype exists).
_netcdftype_dict = {
    's': 'short',
    '1': 'byte',
    'l': 'int',
    'i': 'int',
    'f': 'float',
    'd': 'double',
    'c': 'character',
    'F': False,
    'D': False,
}

# single-character Numeric typecode -> name printed by the __repr__ method.
_reprtype_dict = {
    's': 'short',
    '1': 'byte',
    'l': 'int',
    'i': 'int',
    'f': 'float',
    'd': 'double',
    'c': 'character',
    'F': 'complex',
    'D': 'double_complex',
}

# _NetCDF_FillValue defaults, taken from the netCDF 3.6.1 header file.
_fillvalue_dict = {
    'f': 9.9692099683868690e+36,
    'd': 9.9692099683868690e+36,     # near 15 * 2^119
    'F': 9.9692099683868690e+36+0j,  # next two I made up
    'D': 9.9692099683868690e+36+0j,  # (no Complex in netCDF)
    'i': -2147483647,
    'l': -2147483647,
    's': -32767,
    '1': -127,                       # (signed char)-127
    'c': chr(0),                     # (char)0
}

139

140

def _quantize(data,least_significant_digit):
    """Quantize data to improve compression.

    Returns around(scale*data)/scale, where scale is 2**bits and bits
    is derived from least_significant_digit.  For example, if
    least_significant_digit=1, bits will be 4."""
    # decimal exponent of the requested precision, rounded away from zero.
    decimal_exp = math.log(10.**-least_significant_digit, 10)
    if decimal_exp < 0:
        decimal_exp = int(math.floor(decimal_exp))
    else:
        decimal_exp = int(math.ceil(decimal_exp))
    # number of binary digits needed to resolve 10**decimal_exp.
    nbits = math.ceil(math.log(10.**-decimal_exp, 2))
    factor = 2.**nbits
    return numarray.around(factor*data)/factor

155

156

class NetCDFFile:

157

"""

158

netCDF file Constructor: NetCDFFile(filename, mode="r",history=None)

159

160

Arguments:

161

162

filename -- Name of hdf5 file to hold data.

163

164

mode -- access mode. "r" means read-only; no data can be modified.

165

"w" means write; a new file is created, an existing

166

file with the same name is deleted. "a" means append

167

(in analogy with serial files); an existing file is

168

opened for reading and writing.

169

170

history -- a string that is used to define the global NetCDF

171

attribute 'history'.

172

173

A NetCDFFile object has two standard attributes: 'dimensions' and

174

'variables'. The values of both are dictionaries, mapping

175

dimension names to their associated lengths and variable names to

176

variables, respectively. Application programs should never modify

177

these dictionaries.

178

179

A list of attributes corresponding to global netCDF attributes

180

defined in the file can be obtained with the ncattrs method.

181

Global file attributes are created by assigning to an attribute of

182

the NetCDFFile object.

183

"""

184

185

def __init__(self,filename,mode='r',history=None):

186

# open an hdf5 file.

187

self._NetCDF_h5file = tables.openFile(filename, mode=mode)

188

self._NetCDF_mode = mode

189

# file already exists, set up variable and dimension dicts.

190

if mode != 'w':

191

self.dimensions = {}

192

self.variables = {}

193

for var in self._NetCDF_h5file.root:

194

if not isinstance(var,tables.CArray) and not isinstance(var,tables.EArray):

195

print 'object',var,'is not a EArray or CArray, skipping ..'

196

continue

197

if var.stype not in _typecode_dict.keys():

198

print 'object',var.name,'is not a supported datatype (',var.stype,'), skipping ..'

199

continue

200

if var.attrs.__dict__.has_key('dimensions'):

201

n = 0

202

for dim in var.attrs.__dict__['dimensions']:

203

if var.extdim >= 0 and n == var.extdim:

204

val=None

205

else:

206

val=int(var.shape[n])

207

if not self.dimensions.has_key(dim):

208

self.dimensions[dim] = val

209

else:

210

# raise an exception of a dimension of that

211

# name has already been encountered with a

212

# different value.

213

if self.dimensions[dim] != val:

214

raise KeyError,'dimension lengths not consistent'

215

n = n + 1

216

else:

217

print 'object',var.name,'does not have a dimensions attribute, skipping ..'

218

continue

219

self.variables[var.name]=_NetCDFVariable(var,self)

220

if len(self.variables.keys()) == 0:

221

raise IOError, 'file does not contain any objects compatible with tables.NetCDF'

222

else:

223

# initialize dimension and variable dictionaries for a new file.

224

self.dimensions = {}

225

self.variables = {}

226

# set history attribute.

227

if mode != 'r':

228

if history != None:

229

self.history = history

230

231

def createDimension(self,dimname,size):
    """Creates a new dimension with the given "dimname" and
    "size". "size" must be a positive integer or 'None',
    which stands for the unlimited dimension. There can
    be only one unlimited dimension per dataset.

    Raises ValueError if the assignment would leave more than one
    unlimited dimension in 'dimensions'; in that case 'dimensions'
    is left untouched."""
    # count the unlimited dimensions there would be *after* the
    # assignment, without performing it yet, so that a rejected
    # request does not stay registered in the dictionary.
    n_unlimited = 0
    if size is None:
        n_unlimited = 1
    for name,length in self.dimensions.items():
        if name != dimname and length is None:
            n_unlimited = n_unlimited + 1
    # make sure there is only one unlimited dimension.
    if n_unlimited > 1:
        raise ValueError('only one unlimited dimension allowed!')
    self.dimensions[dimname] = size

240

241

def createVariable(self,varname,datatype,dimensions,least_significant_digit=None,expectedsize=1000,filters=None):
    """Creates a new variable with the given "varname", "datatype", and
    "dimensions", registers it in 'variables' and returns the
    NetCDFVariable object describing it.

    The "datatype" is a one-letter string with the same meaning as the
    typecodes for arrays in module Numeric; in practice the predefined
    type constants from Numeric should be used. "dimensions" must be
    a tuple containing dimension names (strings) that have been
    defined previously. The unlimited dimension must be the first
    (leftmost) dimension of the variable.

    If the optional keyword parameter 'least_significant_digit' is
    specified, multidimensional variables will be truncated
    (quantized). This can significantly improve compression. For
    example, if least_significant_digit=1, data will be quantized
    using around(scale*data)/scale, where scale = 2**bits, and bits
    is determined so that a precision of 0.1 is retained (in this
    case bits=4).
    From http://www.cdc.noaa.gov/cdc/conventions/cdc_netcdf_standard.shtml:
    "least_significant_digit -- power of ten of the smallest decimal
    place in unpacked data that is a reliable value."

    The 'expectedsize' keyword applies only to variables with an
    unlimited dimension - it is the expected number of entries that
    will be added along the unlimited dimension (default 1000). If
    you think the actual number of entries will be an order of
    magnitude different than the default, consider providing a guess;
    this will optimize the HDF5 B-Tree creation, management process
    time, and memory usage.

    The 'filters' keyword also applies only to variables with an
    unlimited dimension, and is a PyTables filters instance that
    describes how to store an enlargeable array on disk. The default
    is tables.Filters(complevel=6, complib='zlib', shuffle=1,
    fletcher32=0)."""
    # NOTE(review): the module docstring says the unlimited dimension
    # need not be the first one; confirm which statement is current.
    # build the NetCDFVariable and record it under its name.
    new_variable = NetCDFVariable(
        varname, self, datatype, dimensions,
        least_significant_digit=least_significant_digit,
        expectedsize=expectedsize,
        filters=filters)
    self.variables[varname] = new_variable
    return new_variable

284

285

def close(self):
    """Closes the file (after calling the sync method).

    The hdf5 file is closed even if the sync method raises; the
    exception from sync then propagates to the caller."""
    try:
        self.sync()
    finally:
        # never leave the hdf5 file open because synchronizing failed.
        self._NetCDF_h5file.close()

289

290

def sync(self):
    """
    synchronize variables along unlimited dimension, filling in data
    with default netCDF _FillValue. Returns the length of the
    unlimited dimension (0 if no variable has one). Invoked
    automatically when the NetCDFFile object is closed.

    In read-only mode ('r') nothing is written; only the maximum
    length is returned.
    """
    # only variables with an unlimited dimension (extdim >= 0) take part;
    # fixed-size variables are never indexed with their extdim.
    unlim_vars = [var for var in self.variables.values() if var.extdim >= 0]
    if not unlim_vars:
        return 0
    # find max length of unlimited dimension.
    len_max = max([var.shape[var.extdim] for var in unlim_vars])
    if self._NetCDF_mode == 'r':
        return len_max # just returns max length of unlim dim if read-only
    # fill in variables that have fewer entries along the unlimited
    # dimension than the max with _FillValue.
    for var in unlim_vars:
        len_var = var.shape[var.extdim]
        if len_var < len_max:
            # shape of the missing slab: same as the variable, except
            # along the unlimited dimension.
            shp = list(var.shape)
            shp[var.extdim] = len_max-len_var
            var._NetCDF_varobj.append(var._NetCDF_FillValue*numarray.ones(shp,var.typecode()))
    return len_max

319

320

def __repr__(self):
    """produces output similar to 'ncdump -h'.

    Calls the sync method to obtain the current length of the
    unlimited dimension."""
    # NOTE(review): whitespace inside the string literals is reproduced
    # exactly as it appears in this listing.
    info = [self._NetCDF_h5file.filename+' {\n']
    info.append('dimensions:\n')
    len_unlim = int(self.sync())
    for key,val in self.dimensions.items():
        if val is None:
            # the unlimited dimension: report its current length.
            info.append(' '+key+' = UNLIMITED ; // ('+repr(len_unlim)+' currently)\n')
        else:
            info.append(' '+key+' = '+repr(val)+' ;\n')
    info.append('variables:\n')
    for varname,var in self.variables.items():
        dims = var.dimensions
        typename = _reprtype_dict[var.typecode()]
        info.append(' '+typename+' '+varname+str(dims)+' ;\n')
        # one line per variable attribute.
        for key in var.ncattrs():
            info.append(' '+varname+':'+key+' = '+repr(getattr(var,key))+' ;\n')
    info.append('// global attributes:\n')
    for key in self.ncattrs():
        info.append(' :'+key+' = '+repr(getattr(self,key))+' ;\n')
    info.append('}')
    return ''.join(info)

348

349

def __setattr__(self,name,value):
    # names that begin with '_', plus 'dimensions' and 'variables',
    # are temporaries at the python level (not stored in the hdf5
    # file); every other name is set on the attributes of the hdf5
    # root group.
    python_level = name.startswith('_') or name in ('dimensions','variables')
    if not python_level:
        setattr(self._NetCDF_h5file.root._v_attrs,name,value)
        return
    # python-level names that end in '__' are silently ignored.
    if name.endswith('__'):
        return
    self.__dict__[name] = value

357

358

def __getattr__(self,name):

359

if name.startswith('__') and name.endswith('__'):

360

raise AttributeError

361

elif name.startswith('_NetCDF_') or name in ['dimensions','variables']:

362

return self.__dict__[name]

363

else:

364

if self.__dict__.has_key(name):

365

return self.__dict__[name]

366

else:

367

return self._NetCDF_h5file.root._v_attrs.__dict__[name]

368

369

def ncattrs(self):
    """return attributes corresponding to netCDF file attributes"""
    # a new list of the user attribute names of the hdf5 root group.
    root_attrs = self._NetCDF_h5file.root._v_attrs
    return list(root_attrs._v_attrnamesuser)

372

373

def h5tonc(self,filename,packshort=False,scale_factor=None,add_offset=None):

374

"""convert to a true netcdf file (filename). Requires

375

Scientific.IO.NetCDF module. If packshort=True, variables are

376

packed as short integers using the dictionaries scale_factor

377

and add_offset. The dictionary keys are the the variable names

378

in the hdf5 file to be packed as short integers. Each

379

variable's unlimited dimension must be the slowest varying

380

(the first dimension for C/Python, the last for Fortran)."""

381

382

if not ScientificIONetCDF_imported or not Numeric_imported:

383

print 'Scientific.IO.NetCDF and Numeric must be installed to convert to NetCDF'

384

return

385

ncfile = RealNetCDF.NetCDFFile(filename,'w')

386

# create dimensions.

387

for dimname,size in self.dimensions.iteritems():

388

ncfile.createDimension(dimname,size)

389

# create global attributes.

390

for key in self.ncattrs():

391

setattr(ncfile,key,getattr(self,key))

392

# create variables.

393

for varname,varin in self.variables.iteritems():

394

packvar = False

395

dims = varin.dimensions

396

dimsizes = [self.dimensions[dim] for dim in dims]

397

if None in dimsizes:

398

if dimsizes.index(None) != 0:

399

raise ValueError,'unlimited or enlargeable dimension must be most significant (slowest changing, or first) one in order to convert to a true netCDF file'

400

if packshort and scale_factor.has_key(varname) and add_offset.has_key(varname):

401

print 'packing %s as short integers ...'%(varname)

402

datatype = 's'

403

packvar = True

404

else:

405

datatype = varin.typecode()

406

if not _netcdftype_dict[datatype]:

407

raise ValueError,'datatype not supported in netCDF, cannot convert to a true netCDF file'

408

409

varout = ncfile.createVariable(varname,datatype,dims)

410

for key in varin.ncattrs():

411

setattr(varout,key,getattr(varin,key))

412

if packvar:

413

setattr(varout,'scale_factor',scale_factor[varname])

414

setattr(varout,'add_offset',add_offset[varname])

415

for n in range(varin.shape[0]):

416

if packvar:

417

varout[n] = ((1./scale_factor[varname])*(varin[n] - add_offset[varname])).astype('s')

418

else:

419

if datatype == 'c':

420

varout[n] = Numeric.reshape(Numeric.array(varin[n].flat,'c'),varin.shape[1:])

421

else:

422

varout[n] = varin[n]

423

# close file.

424

ncfile.close()

425

426

def nctoh5(self, filename, unpackshort=True, filters=None):
    """Convert a true netCDF file (filename) to an hdf5 file
    compatible with this module.  Requires the Scientific.IO.NetCDF
    module.

    If unpackshort=True, variables stored as short integers with a
    scale and offset are unpacked to Float32 variables in the hdf5
    file.  If the least_significant_digit attribute is set, the data
    is quantized to improve compression.  Use the filters keyword to
    change the default tables.Filters instance used for compression
    (see the createVariable docstring for details).

    Returns a (nobjects, nbytes) tuple: the number of variables copied
    and the sum, over those variables, of the number of elements times
    the itemsize of the resulting hdf5 array.  If Scientific.IO.NetCDF
    or Numeric could not be imported, a message is printed and None is
    returned instead.
    """

    if not ScientificIONetCDF_imported or not Numeric_imported:
        print('Scientific.IO.NetCDF and Numeric must be installed to convert from NetCDF')
        return

    def _unpack(ncvar, idata):
        # Apply scale/offset to packed data and flag missing values.
        # Must only be used for variables that are being unpacked: the
        # variable's missing_value attribute is rewritten to 1.e30 only
        # in that case, so the data may only be rewritten then as well.
        tmpdata = (ncvar.scale_factor*idata + ncvar.add_offset).astype('f')
        if hasattr(ncvar, 'missing_value'):
            tmpdata = Numeric.where(idata >= ncvar.missing_value, 1.e30, tmpdata)
        return tmpdata

    ncfile = RealNetCDF.NetCDFFile(filename, 'r')
    try:
        # type of a Numeric array, used to recognise array-valued attributes.
        arraytype = type(Numeric.array([1]))

        # create dimensions.
        for dimname, size in ncfile.dimensions.items():
            self.createDimension(dimname, size)

        # create variables.
        for varname, ncvar in ncfile.variables.items():
            if hasattr(ncvar, 'least_significant_digit'):
                lsd = ncvar.least_significant_digit
            else:
                lsd = None
            dounpackshort = bool(unpackshort and
                                 hasattr(ncvar, 'scale_factor') and
                                 hasattr(ncvar, 'add_offset'))
            if dounpackshort:
                datatype = 'f'
            else:
                datatype = ncvar.typecode()
            var = self.createVariable(varname, datatype, ncvar.dimensions,
                                      least_significant_digit=lsd,
                                      filters=filters)
            for key, val in ncvar.__dict__.items():
                if dounpackshort:
                    # the packing attributes no longer apply once unpacked.
                    if key in ('add_offset', 'scale_factor'):
                        continue
                    if key == 'missing_value':
                        val = 1.e30
                # convert rank-0 Numeric array to python float/int/string
                if isinstance(val, arraytype) and len(val) == 1:
                    val = val[0]
                setattr(var, key, val)

        # fill variables with data.
        nobjects = 0
        nbytes = 0
        for varname, ncvar in ncfile.variables.items():
            var = self.variables[varname]
            extdim = var._NetCDF_varobj.extdim
            dounpackshort = bool(unpackshort and
                                 hasattr(ncvar, 'scale_factor') and
                                 hasattr(ncvar, 'add_offset'))
            if extdim >= 0:
                # write data to enlargeable array one chunk of records at a
                # time (so the whole array doesn't have to be kept in memory).
                nrowsinbuf = var._NetCDF_varobj._v_maxTuples
                # The slices parameter for ncvar.__getitem__()
                slices = [slice(0, dim, 1) for dim in ncvar.shape]
                # range to copy
                stop = ncvar.shape[extdim]
                step = max(nrowsinbuf, 1)
                for start2 in range(0, stop, step):
                    stop2 = min(start2 + step, stop)
                    # Select every record of this chunk along the extensible
                    # dimension.  The stride must be 1: using the chunk
                    # length as stride would read only the first record of
                    # each chunk.
                    slices[extdim] = slice(start2, stop2, 1)
                    idata = ncvar[tuple(slices)]
                    if dounpackshort:
                        tmpdata = _unpack(ncvar, idata)
                    else:
                        tmpdata = idata
                    var.append(tmpdata)
            else:
                idata = ncvar[:]
                if dounpackshort:
                    tmpdata = _unpack(ncvar, idata)
                else:
                    tmpdata = idata
                if ncvar.typecode() == 'c':
                    # numarray string arrays with itemsize=1 used for netCDF char arrays.
                    # It is important to set the padding character to NULL
                    # in order to avoid the '' string to become a ' '
                    # after de-serializing.  See:
                    # http://sourceforge.net/tracker/index.php?func=detail&aid=1304615&group_id=1369&atid=450446
                    # for more info.
                    # F. Altet 2005-11-07
                    var[:] = numarray.strings.array(tmpdata.tolist(),
                                                    itemsize=1,
                                                    padc=_fillvalue_dict[ncvar.typecode()])
                else:
                    # if data is in a CArray, convert to numarray
                    # (done automatically for EArrays)
                    if isinstance(var._NetCDF_varobj, tables.CArray):
                        tmpdata = tables.utils.convertToNA(tmpdata, var._NetCDF_varobj.atom)
                    var[:] = tmpdata
            # Increment the counters.  An explicit product is used so that
            # an empty shape tuple counts as one element instead of raising.
            nelements = 1
            for dimlen in var._NetCDF_varobj.shape:
                nelements *= dimlen
            nobjects += 1
            nbytes += nelements * var._NetCDF_varobj.itemsize

        # create global attributes.
        for key, val in ncfile.__dict__.items():
            # convert Numeric rank-0 array to a python float/int/string
            if isinstance(val, arraytype) and len(val) == 1:
                val = val[0]
            # if attribute is a Numeric array, convert to python list.
            if isinstance(val, arraytype) and len(val) > 1:
                val = val.tolist()
            setattr(self, key, val)
    finally:
        # close the netCDF file even if the conversion failed part-way.
        ncfile.close()
    self.sync()
    return nobjects, nbytes

547

548

class _NetCDFAttributeError(AttributeError, KeyError):
    """Raised by NetCDFVariable.__getattr__ for a missing attribute.

    It is an AttributeError so that getattr(var, name, default) and
    hasattr(var, name) behave as expected, and also a KeyError so that
    callers written against the previous behaviour (a plain KeyError
    escaping from the dictionary lookup) keep working.
    """


class NetCDFVariable:
    """Variable in a netCDF file

    NetCDFVariable objects are constructed by calling the method
    'createVariable' on the NetCDFFile object.

    NetCDFVariable objects behave much like array objects defined in
    module Numeric, except that their data resides in a file.  Data is
    read by indexing and written by assigning to an indexed subset;
    the entire array can be accessed by the index '[:]'.

    Variables with an unlimited dimension can be compressed on
    disk (by default, zlib compression (level=6) and the HDF5
    'shuffle' filter are used).  The default can be changed by passing
    a tables.Filters instance to createVariable via the filters
    keyword argument.  Truncating the data to a precision specified by
    the least_significant_digit optional keyword argument to
    createVariable will significantly improve compression.

    A list of attributes corresponding to variable attributes defined
    in the netCDF file can be obtained with the ncattrs method.
    """

    def __init__(self, varname, NetCDFFile, datatype, dimensions,
                 least_significant_digit=None, expectedsize=1000,
                 filters=None):
        """Create the hdf5 array backing a new variable.

        varname -- name (and title) of the array created under the
            root group of the parent's hdf5 file.
        NetCDFFile -- parent file object; its 'dimensions' mapping and
            '_NetCDF_h5file' attribute are used.
        datatype -- typecode; must be a key of _netcdftype_dict,
            otherwise ValueError is raised.
        dimensions -- sequence of dimension names, looked up in
            NetCDFFile.dimensions.  The first dimension whose size is
            None becomes the enlargeable one.
        least_significant_digit -- if not None, stored as an attribute
            of the array (it triggers quantization on writes).
        expectedsize -- passed as 'expectedrows' when an EArray is
            created.
        filters -- tables.Filters instance; defaults to
            Filters(complevel=6, complib='zlib', shuffle=1).
        """
        if datatype not in _netcdftype_dict:
            raise ValueError('datatype must be one of %s' % list(_netcdftype_dict.keys()))
        self._NetCDF_parent = NetCDFFile
        _NetCDF_FillValue = _fillvalue_dict[datatype]
        vardimsizes = [NetCDFFile.dimensions[d] for d in dimensions]
        # locate the first unlimited (size None) dimension, if any.
        extdim = -1
        for ndim, vardim in enumerate(vardimsizes):
            if vardim is None:
                extdim = ndim
                break
        if extdim >= 0:
            # set shape to 0 for extdim.
            vardimsizes[extdim] = 0
        if datatype == 'c':
            # Special case for Numeric character objects
            # (on which base Scientific.IO.NetCDF works)
            atom = tables.StringAtom(shape=tuple(vardimsizes), length=1)
        else:
            atom = tables.Atom(dtype=datatype, shape=tuple(vardimsizes))
        if filters is None:
            # default filters instance.
            filters = tables.Filters(complevel=6, complib='zlib', shuffle=1)
        if extdim >= 0:
            # enlargeable dimension, use EArray
            self._NetCDF_varobj = NetCDFFile._NetCDF_h5file.createEArray(
                where=NetCDFFile._NetCDF_h5file.root,
                name=varname, atom=atom, title=varname,
                filters=filters,
                expectedrows=expectedsize)
        else:
            # no enlargeable dimension, use CArray
            self._NetCDF_varobj = NetCDFFile._NetCDF_h5file.createCArray(
                where=NetCDFFile._NetCDF_h5file.root,
                name=varname, shape=tuple(vardimsizes),
                atom=atom, title=varname, filters=filters)
            # fill with _FillValue
            if datatype == 'c':
                # numarray string arrays with itemsize=1 used for char arrays.
                self[:] = numarray.strings.array(shape=tuple(vardimsizes), itemsize=1)
            else:
                self[:] = _NetCDF_FillValue*numarray.ones(tuple(vardimsizes), datatype)
        if least_significant_digit is not None:
            setattr(self._NetCDF_varobj.attrs, 'least_significant_digit',
                    least_significant_digit)
        # written directly on the attribute set because 'dimensions' is
        # read-only through __setattr__.
        setattr(self._NetCDF_varobj.attrs, 'dimensions', dimensions)
        self._NetCDF_FillValue = _NetCDF_FillValue

    def __setitem__(self, key, data):
        """Write data to the indexed subset, quantizing it first if the
        variable has a least_significant_digit attribute."""
        # if assigning to a CArray, convert to numarray.
        # (done automatically for EArrays)
        if isinstance(self._NetCDF_varobj, tables.CArray):
            data = tables.utils.convertToNA(data, self._NetCDF_varobj.atom)
        if hasattr(self, 'least_significant_digit'):
            self._NetCDF_varobj[key] = _quantize(data, self.least_significant_digit)
        else:
            self._NetCDF_varobj[key] = data

    def __getitem__(self, key):
        """Read the indexed subset from the underlying hdf5 array."""
        return self._NetCDF_varobj[key]

    def __len__(self):
        """Return the length of the first dimension."""
        return int(self._NetCDF_varobj.shape[0])

    def __setattr__(self, name, value):
        """Set an attribute.

        Names that do not begin with '_NetCDF_' are stored as attributes
        of the underlying hdf5 array.  Names that begin with '_NetCDF_'
        are temporaries at the python level (not stored in the hdf5
        file); those ending in '__' are ignored.  'dimensions' is
        read-only and raises KeyError.
        """
        if name in ['dimensions']:
            raise KeyError('"dimensions" is a read-only attribute - cannot modify')
        if not name.startswith('_NetCDF_'):
            setattr(self._NetCDF_varobj.attrs, name, value)
        elif not name.endswith('__'):
            self.__dict__[name] = value

    def __getattr__(self, name):
        """Look up an attribute that normal lookup did not find.

        '_NetCDF_' names come from the instance dictionary; any other
        name is looked up first in the underlying array object's
        __dict__ and then in its attribute set's __dict__.  A missing
        name raises an exception that is both an AttributeError and a
        KeyError.
        """
        if name.startswith('__') and name.endswith('__'):
            raise AttributeError(name)
        try:
            if name.startswith('_NetCDF_'):
                return self.__dict__[name]
            varobj = self._NetCDF_varobj
            if name in varobj.__dict__:
                return varobj.__dict__[name]
            return varobj.attrs.__dict__[name]
        except KeyError:
            # report a failed lookup the way the attribute protocol
            # expects, so getattr() with a default and hasattr() work.
            raise _NetCDFAttributeError(name)

    def typecode(self):
        """
        return a single character Numeric typecode.
        Allowed values are
        'd' == Float64, 'f' == Float32, 'l' == Int32,
        'i' == Int32, 's' == Int16, '1' == Int8,
        'c' == StringType (length 1), 'F' == Complex32 and 'D' == Complex64.
        The corresponding NetCDF data types are
        'double', 'float', 'int', 'int', 'short', 'byte' and 'character'.
        ('D' and 'F' have no corresponding netCDF data types).
        """
        return _typecode_dict[self._NetCDF_varobj.stype]

    def ncattrs(self):
        """return attributes corresponding to netCDF variable attributes"""
        return [attr for attr in self._NetCDF_varobj.attrs._v_attrnamesuser
                if attr != 'dimensions']

    def append(self, data):
        """
        Append data along unlimited dimension of a NetCDFVariable.

        The data must have either the same number of dimensions as the
        NetCDFVariable instance that it is being appended to, or one
        less.  If it has one less dimension, it is assumed that the
        missing dimension is a singleton dimension corresponding to the
        unlimited dimension of the NetCDFVariable.

        If the NetCDFVariable has a least_significant_digit attribute,
        the data is truncated (quantized) to improve compression.

        Raises IOError if the parent file is read only, and IndexError
        if the variable has no unlimited dimension or the data has an
        incompatible shape.
        """
        if self._NetCDF_parent._NetCDF_mode == 'r':
            raise IOError('file is read only')
        # if data is not an array, try to make it so.
        try:
            data.shape
        except AttributeError:
            data = numarray.array(data, self.typecode())
        # check to make sure there is an unlimited dimension.
        # (i.e. data is in an EArray).
        varshape = self._NetCDF_varobj.shape
        extdim = self._NetCDF_varobj.extdim
        if extdim < 0:
            raise IndexError('variable has no unlimited dimension')
        # special case that data array is same
        # shape as EArray, minus the enlargeable dimension.
        # if so, add an extra singleton dimension.
        if len(data.shape) != len(varshape):
            shapem1 = tuple([dim for n, dim in enumerate(varshape) if n != extdim])
            if data.shape != shapem1:
                raise IndexError('data must either have same number of dimensions as variable, or one less (excluding unlimited dimension)')
            shapenew = list(varshape)
            shapenew[extdim] = 1
            data = numarray.reshape(data, shapenew)
        # append the data to the variable object.
        if hasattr(self, 'least_significant_digit'):
            self._NetCDF_varobj.append(_quantize(data, self.least_significant_digit))
        else:
            self._NetCDF_varobj.append(data)

    def assignValue(self, value):
        """
        Assigns value to the variable: appended if the variable has an
        unlimited dimension, otherwise written to the whole array.
        """
        if self._NetCDF_varobj.extdim >= 0:
            self.append(value)
        else:
            self[:] = value

    def getValue(self):
        """
        Returns the value of the variable.
        """
        return self[:]

740

741

class _NetCDFVariable(NetCDFVariable):
    """Variable wrapping an array that already exists in an hdf5 file.

    Only used internally, to create netCDF variable objects from Array
    objects read in from an hdf5 file.
    """

    def __init__(self, var, NetCDFFile):
        # the array must be attached before typecode() is called,
        # since typecode() reads it.
        self._NetCDF_varobj = var
        self._NetCDF_parent = NetCDFFile
        code = self.typecode()
        self._NetCDF_FillValue = _fillvalue_dict[code]

Older »