/[thuban]/branches/WIP-pyshapelib-bramz/Thuban/Model/table.py

Diff of /branches/WIP-pyshapelib-bramz/Thuban/Model/table.py

Parent Directory | Revision Log | View Patch Patch

-revision 984 by bh,
Thu May 22 16:37:48 2003 UTC
+revision 1599 by bh,
Mon Aug 18 12:45:28 2003 UTC
 Line 2
  # Authors:
  # Bernhard Herzog <[email protected]>
  # Jan-Oliver Wagner <[email protected]>
+ # Frank Koormann <[email protected]>
  #
  # This program is free software under the GPL (>=v2)
  # Read the file COPYING coming with Thuban for details.
-Line 12 
 Classes for handling tables of data.
+Line 13 
 Classes for handling tables of data.
  __version__ = "$Revision$"
+ import os
  import inspect
  import warnings
+ from base import TitledObject
  import dbflib
  # the field types supported by a Table instance.
-Line 107 
 class DBFColumn:
+Line 111 
 class DBFColumn:
          self.index = index
- class DBFTable(OldTableInterfaceMixin):
+ class DBFTable(TitledObject, OldTableInterfaceMixin):
      """
      Table interface for the data in a DBF file
-Line 128 
 class DBFTable(OldTableInterfaceMixin):
+Line 132 
 class DBFTable(OldTableInterfaceMixin):
      # work because a DBF file object buffers some data
      def __init__(self, filename):
-         self.filename = filename
+         self.filename = os.path.abspath(filename)
+         # Omit the extension in the title as it's not really needed and
+         # it can be confusing because dbflib removes extensions and
+         # appends some variations of '.dbf' before it tries to open the
+         # file. So the title could be e.g. myshapefile.shp when the real
+         # filename is myshapefile.dbf
+         title = os.path.splitext(os.path.basename(self.filename))[0]
+         TitledObject.__init__(self, title)
          self.dbf = dbflib.DBFFile(filename)
          # If true, self.dbf is open for writing.
-Line 224 
 class DBFTable(OldTableInterfaceMixin):
+Line 237 
 class DBFTable(OldTableInterfaceMixin):
      # DBF specific interface parts.
+     def Width(self, col):
+         """Return column width"""
+         return self.column_map[col].width
      def Destroy(self):
          self.dbf.close()
          self.dbf = None
-Line 249 
 class DBFTable(OldTableInterfaceMixin):
+Line 266 
 class DBFTable(OldTableInterfaceMixin):
          self.dbf.write_record(record, values)
          self.dbf.commit()
+     def FileName(self):
+         """Return the absolute path of the file the DBFTable was instantiated with"""
+         return self.filename
  class MemoryColumn:
-Line 258 
 class MemoryColumn:
+Line 278 
 class MemoryColumn:
          self.type = type
          self.index = index
- class MemoryTable(OldTableInterfaceMixin):
+ class MemoryTable(TitledObject, OldTableInterfaceMixin):
      """Very simple table implementation that operates on a list of tuples"""
-Line 270 
 class MemoryTable(OldTableInterfaceMixin
+Line 290 
 class MemoryTable(OldTableInterfaceMixin
          data -- List of tuples, one for each row of data
          """
          self.data = data
+         title = 'MemoryTable'
+         TitledObject.__init__(self, title)
          # Create the column information objects
          self.columns = []
-Line 336 
 class MemoryTable(OldTableInterfaceMixin
+Line 358 
 class MemoryTable(OldTableInterfaceMixin
          return min(values), max(values)
      def UniqueValues(self, col):
-         """Return a sorted list of all unique values in the column col"""
+         """Return a sorted list of all unique values in the column col
+         col can be either column index or name.
+         """
          dict = {}
          for i in range(self.NumRows()):
-Line 347 
 class MemoryTable(OldTableInterfaceMixin
+Line 372 
 class MemoryTable(OldTableInterfaceMixin
          values.sort()
          return values
+     def Width(self, col):
+         """Return the maximum width of values in the column
+         The return value is the maximum length of the string
+         representation of the values in the column (identified by index
+         or name).
+         """
+         max = 0
+         type  = self.column_map[col].type
+         index = self.column_map[col].index
+         values = [row[index] for row in self.data]
+         if not values:
+             return None
+         if type == FIELDTYPE_DOUBLE:
+             format = "%.12f"
+         elif type == FIELDTYPE_INT:
+             format = "%d"
+         else:
+             format = "%s"
+         for value in values:
+             l = len(format % value)
+             if l > max:
+                 max = l
+         return max
      def Dependencies(self):
          """Return an empty sequence. The MemoryTable doesn't depend on anything
          """
-Line 358 
 class MemoryTable(OldTableInterfaceMixin
+Line 411 
 class MemoryTable(OldTableInterfaceMixin
          # TODO: Allow values to be a dictionary and write the single
          # fields that are specified.
          self.data[record] = values
def _find_dbf_column_names(names):
    """Determine the column names to use in a DBF file

    DBF files have a length limit of 10 characters on the column names,
    so when writing an arbitrary Thuban table to a DBF file we may have
    to rename some of the columns, making sure that they're unique in
    the DBF file too.

    Names that are already short enough will stay the same. Longer names
    will be truncated to 10 characters or, if that isn't unique, they
    will be truncated more and filled up with digits.

    The parameter names should be a sequence of the column names. It is
    not modified. The return value is a dictionary mapping the names in
    the input sequence to the names to use in the DBF file.

    Raise ValueError if no unique name can be found for a column.
    """
    # mapping from the original names in table to the names in the DBF
    # file
    name_map = {}

    # First, we keep all names that are already short enough. The longer
    # names are collected in a list of their own (in their original
    # order) instead of deleting the short ones from names, so that the
    # caller's sequence is left untouched.
    long_names = []
    for name in names:
        if len(name) <= 10:
            name_map[name] = name
        else:
            long_names.append(name)

    # dict used as a set of all names already used as DBF column names
    used = name_map.copy()

    # Go through all longer names. If the name truncated to 10
    # characters is not used already, we use that. Otherwise we truncate
    # it more and append numbers until we get an unused name
    for name in long_names:
        truncated = name[:10]
        num = 0
        numstr = ""
        while truncated in used and len(numstr) < 10:
            num += 1
            numstr = str(num)
            truncated = name[:10 - len(numstr)] + numstr
        if len(numstr) >= 10:
            # This case should never happen in practice as tables with
            # 10^10 columns seem very unlikely :)
            raise ValueError("Can't find unique dbf column name")
        name_map[name] = truncated
        used[truncated] = 1

    return name_map
def table_to_dbf(table, filename, rows = None):
    """Create the dbf file filename from the table.

    If rows is None (the default) all rows are saved. Otherwise it must
    be a list of row indices to be saved to the file; the rows are
    written in the order given, numbered consecutively from 0.

    Column names longer than 10 characters are renamed as determined by
    _find_dbf_column_names.
    """
    dbf = dbflib.create(filename)
    # Make sure the DBF file is closed again even if writing the header
    # or one of the records fails.
    try:
        dbflib_fieldtypes = {FIELDTYPE_STRING: dbflib.FTString,
                             FIELDTYPE_INT: dbflib.FTInteger,
                             FIELDTYPE_DOUBLE: dbflib.FTDouble}

        name_map = _find_dbf_column_names([col.name
                                           for col in table.Columns()])

        # Initialise the header. Columns that don't carry a precision of
        # their own get 12 decimal places for doubles and 0 otherwise.
        for col in table.Columns():
            # NOTE(review): MemoryTable.Width returns None for a table
            # without rows -- confirm that dbflib's add_field copes
            # with that.
            width = table.Width(col.name)
            if col.type == FIELDTYPE_DOUBLE:
                prec = getattr(col, "prec", 12)
            else:
                prec = 0
            dbf.add_field(name_map[col.name], dbflib_fieldtypes[col.type],
                          width, prec)

        if rows is None:
            rows = range(table.NumRows())

        recNum = 0
        for i in rows:
            # Translate the table's column names to the DBF names
            record = {}
            for key, value in table.ReadRowAsDict(i).items():
                record[name_map[key]] = value
            dbf.write_record(recNum, record)
            recNum += 1
    finally:
        dbf.close()
def table_to_csv(table, filename, rows = None):
    """Export table to csv file.

    The first line of the file is a header consisting of a '#' followed
    by the comma separated column names. Each of the following lines
    holds the comma separated values of one row, in the order of the
    columns. The values are written as they are; no quoting or escaping
    is done. If the table has no columns an empty file is created.

    If rows is None (the default) all rows are saved. Otherwise it must
    be a list of row indices to be saved to the file.
    """
    outfile = open(filename, "w")
    # Make sure the file is closed again even if reading from the table
    # or writing to the file fails.
    try:
        columns = table.Columns()
        if columns:
            header = ",".join(["%s" % col.name for col in columns])
            outfile.write("#" + header + "\n")

            if rows is None:
                rows = range(table.NumRows())

            for i in rows:
                record = table.ReadRowAsDict(i)
                if not record:
                    # There's nothing to write for an empty record.
                    # Skip it instead of writing the previous row's
                    # line a second time.
                    continue
                values = ["%s" % record[col.name] for col in columns]
                outfile.write(",".join(values) + "\n")
    finally:
        outfile.close()

 Legend:



Removed from v.984
 


changed lines


 
Added in v.1599
 Legend:



Removed from v.984
 


changed lines


 
Added in v.1599
-Removed from v.984
+Added in v.1599

[email protected]	ViewVC Help
Powered by ViewVC 1.1.26