/[thuban]/branches/WIP-pyshapelib-bramz/Thuban/Model/table.py

Diff of /branches/WIP-pyshapelib-bramz/Thuban/Model/table.py

Parent Directory | Revision Log | View Patch Patch

-revision 994 by bh,
Thu May 22 18:05:16 2003 UTC
+revision 1961 by bh,
Wed Nov 19 15:46:03 2003 UTC
 Line 2
  # Authors:
  # Bernhard Herzog <[email protected]>
  # Jan-Oliver Wagner <[email protected]>
+ # Frank Koormann <[email protected]>
  #
  # This program is free software under the GPL (>=v2)
  # Read the file COPYING coming with Thuban for details.
-Line 12 
 Classes for handling tables of data.
+Line 13 
 Classes for handling tables of data.
  __version__ = "$Revision$"
+ import os
  import inspect
  import warnings
+ from base import TitledObject
  import dbflib
  # the field types supported by a Table instance.
-Line 29 
 dbflib_fieldtypes = {dbflib.FTString: FI
+Line 33 
 dbflib_fieldtypes = {dbflib.FTString: FI
                       dbflib.FTDouble: FIELDTYPE_DOUBLE}
- class OldTableInterfaceMixin:
-     """Mixin to implement the old table interface using the new one"""
-     def __deprecation_warning(self):
-         """Issue a DeprecationWarning for code that uses the old interface"""
-         callername = inspect.currentframe().f_back.f_code.co_name
-         warnings.warn("The %s method of the old table interface"
-                       " is deprecated" % callername,
-                       DeprecationWarning, stacklevel = 3)
-     def record_count(self):
-         self.__deprecation_warning()
-         return self.NumRows()
-     def field_count(self):
-         self.__deprecation_warning()
-         return self.NumColumns()
-     def field_info(self, field):
-         """Return a tuple (type, name, width, prec) for the field no. field
-         type is the data type of the field, name the name, width the
-         field width in characters and prec the decimal precision. width
-         and prec will be zero if the information returned by the Column
-         method doesn't provide values for them.
-         """
-         self.__deprecation_warning()
-         col = self.Column(field)
-         return (col.type, col.name,
-                getattr(col, "width", 0), getattr(col, "prec", 0))
-     def field_info_by_name(self, col):
-         self.__deprecation_warning()
-         try:
-             return self.field_info(col)
-         except KeyError:
-             # FIXME: It may be that field_info raises other exceptions
-             # when the name is not a valid column name.
-             return None
-     def field_range(self, fieldName):
-         self.__deprecation_warning()
-         min, max = self.ValueRange(fieldName)
-         return ((min, None), (max, None))
-     def GetUniqueValues(self, field):
-         self.__deprecation_warning()
-         return self.UniqueValues(field)
-     def read_record(self, r):
-         self.__deprecation_warning()
-         return self.ReadRowAsDict(r)
  class DBFColumn:
      """Description of a column in a DBFTable
-Line 107 
 class DBFColumn:
+Line 55 
 class DBFColumn:
          self.index = index
- class DBFTable(OldTableInterfaceMixin):
+ class DBFTable(TitledObject):
      """
      Table interface for the data in a DBF file
-Line 128 
 class DBFTable(OldTableInterfaceMixin):
+Line 76 
 class DBFTable(OldTableInterfaceMixin):
      # work because a DBF file object buffers some data
      def __init__(self, filename):
-         self.filename = filename
+         self.filename = os.path.abspath(filename)
+         # Omit the extension in the title as it's not really needed and
+         # it can be confusing because dbflib removes extensions and
+         # appends some variations of '.dbf' before it tries to open the
+         # file. So the title could be e.g. myshapefile.shp when the real
+         # filename is myshapefile.dbf
+         title = os.path.splitext(os.path.basename(self.filename))[0]
+         TitledObject.__init__(self, title)
          self.dbf = dbflib.DBFFile(filename)
          # If true, self.dbf is open for writing.
-Line 174 
 class DBFTable(OldTableInterfaceMixin):
+Line 131 
 class DBFTable(OldTableInterfaceMixin):
          """
          return self.column_map.has_key(col)
-     def ReadRowAsDict(self, row):
+     def RowIdToOrdinal(self, gid):
-         """Return the entire row as a dictionary with column names as keys"""
+         """Return the row ordinal given its id
+         Since for DBFTables the row id is the row number, return the
+         value unchanged.
+         """
+         return gid
+     def RowOrdinalToId(self, num):
+         """Return the row id given its ordinal
+         Since for DBFTables the row id is the row number, return the
+         value unchanged.
+         """
+         return num
+     def ReadRowAsDict(self, row, row_is_ordinal = 0):
+         """Return the entire row as a dictionary with column names as keys
+         The row_is_ordinal is ignored for DBF tables because the row id
+         is always the row number.
+         """
          return self.dbf.read_record(row)
-     def ReadValue(self, row, col):
+     def ReadValue(self, row, col, row_is_ordinal = 0):
          """Return the value of the specified row and column
          The col parameter may be the index of the column or its name.
+         The row_is_ordinal is ignored for DBF tables because the row id
+         is always the row number.
          """
-         return self.dbf.read_record(row)[self.column_map[col].name]
+         return self.dbf.read_attribute(row, self.column_map[col].index)
      def ValueRange(self, col):
          """Return the minimum and maximum values of the values in the column
-Line 224 
 class DBFTable(OldTableInterfaceMixin):
+Line 204 
 class DBFTable(OldTableInterfaceMixin):
      # DBF specific interface parts.
+     def Width(self, col):
+         """Return column width"""
+         return self.column_map[col].width
      def Destroy(self):
          self.dbf.close()
          self.dbf = None
-Line 261 
 class MemoryColumn:
+Line 245 
 class MemoryColumn:
          self.type = type
          self.index = index
- class MemoryTable(OldTableInterfaceMixin):
+ class MemoryTable(TitledObject):
      """Very simple table implementation that operates on a list of tuples"""
-Line 273 
 class MemoryTable(OldTableInterfaceMixin
+Line 257 
 class MemoryTable(OldTableInterfaceMixin
          data -- List of tuples, one for each row of data
          """
          self.data = data
+         title = 'MemoryTable'
+         TitledObject.__init__(self, title)
          # Create the column information objects
          self.columns = []
-Line 312 
 class MemoryTable(OldTableInterfaceMixin
+Line 298 
 class MemoryTable(OldTableInterfaceMixin
          """Return the number of rows in the table"""
          return len(self.data)
-     def ReadValue(self, row, col):
+     def RowIdToOrdinal(self, gid):
+         """Return the row ordinal given its id
+         Since for MemoryTables the row id is the row number, return the
+         value unchanged.
+         """
+         return gid
+     def RowOrdinalToId(self, num):
+         """Return the row id given its ordinal
+         Since for MemoryTables the row id is the row number, return the
+         value unchanged.
+         """
+         return num
+     def ReadValue(self, row, col, row_is_ordinal = 0):
          """Return the value of the specified row and column
          The col parameter may be the index of the column or its name.
+         The row_is_ordinal is ignored for MemoryTables because the row id
+         is always the row number.
          """
          return self.data[row][self.column_map[col].index]
-     def ReadRowAsDict(self, index):
+     def ReadRowAsDict(self, index, row_is_ordinal = 0):
-         """Return the entire row as a dictionary with column names as keys"""
+         """Return the entire row as a dictionary with column names as keys
+         The row_is_ordinal is ignored for MemoryTables because the row id
+         is always the row number.
+         """
          return dict([(col.name, self.data[index][col.index])
                        for col in self.columns])
-Line 339 
 class MemoryTable(OldTableInterfaceMixin
+Line 348 
 class MemoryTable(OldTableInterfaceMixin
          return min(values), max(values)
      def UniqueValues(self, col):
-         """Return a sorted list of all unique values in the column col"""
+         """Return a sorted list of all unique values in the column col
+         col can be either column index or name.
+         """
          dict = {}
          for i in range(self.NumRows()):
-Line 350 
 class MemoryTable(OldTableInterfaceMixin
+Line 362 
 class MemoryTable(OldTableInterfaceMixin
          values.sort()
          return values
+     def Width(self, col):
+         """Return the maximum width of values in the column
+         The return value is the maximum length of the string
+         representation of the values in the column (represented by index
+         or name). Doubles are formatted with 12 decimal places, integers
+         as decimal numbers and everything else with '%s'.
+         Return None if the table has no rows.
+         """
+         column = self.column_map[col]
+         values = [row[column.index] for row in self.data]
+         if not values:
+             return None
+         # Pick the format used to measure the values. The local names
+         # deliberately avoid hiding the builtins type, format and max.
+         if column.type == FIELDTYPE_DOUBLE:
+             fmt = "%.12f"
+         elif column.type == FIELDTYPE_INT:
+             fmt = "%d"
+         else:
+             fmt = "%s"
+         return max([len(fmt % value) for value in values])
      def Dependencies(self):
          """Return an empty sequence. The MemoryTable doesn't depend on anything
          """
-Line 361 
 class MemoryTable(OldTableInterfaceMixin
+Line 401 
 class MemoryTable(OldTableInterfaceMixin
          # TODO: Allow values to be a dictionary and write the single
          # fields that are specified.
          self.data[record] = values
+ def _find_dbf_column_names(names):
+     """Determine the column names to use in a DBF file
+     DBF files have a length limit of 10 characters on the column names
+     so when writing an arbitrary Thuban table to a DBF file we may have
+     to rename some of the columns, making sure that they're unique in
+     the DBF file too.
+     Names that are already short enough will stay the same. Longer names
+     will be truncated to 10 characters or, if that isn't unique, they
+     will be truncated more and filled up with digits.
+     The parameter names should be a sequence of the column names. It is
+     not modified. The return value will be a dictionary mapping the
+     names in the input sequence to the names to use in the DBF file.
+     Raise ValueError if no unique name can be found for a column.
+     """
+     # mapping from the original names in table to the names in the DBF
+     # file
+     name_map = {}
+     # names that are too long for a DBF file, in their original order.
+     # They're collected in a separate list so that the caller's
+     # sequence is left untouched.
+     long_names = []
+     # First, we keep all names that are already short enough
+     for name in names:
+         if len(name) <= 10:
+             name_map[name] = name
+         else:
+             long_names.append(name)
+     # dict used as a set of all names already used as DBF column names
+     used = name_map.copy()
+     # Go through all longer names. If the name truncated to 10
+     # characters is not used already, we use that. Otherwise we truncate
+     # it more and append numbers until we get an unused name
+     for name in long_names:
+         truncated = name[:10]
+         num = 0
+         numstr = ""
+         while truncated in used and len(numstr) < 10:
+             num += 1
+             numstr = str(num)
+             truncated = name[:10 - len(numstr)] + numstr
+         if len(numstr) >= 10:
+             # This case should never happen in practice as tables with
+             # 10^10 columns seem very unlikely :)
+             raise ValueError("Can't find unique dbf column name")
+         name_map[name] = truncated
+         used[truncated] = 1
+     return name_map
+ def table_to_dbf(table, filename, rows = None):
+     """Create the dbf file filename from the table.
+     If rows is not None it must be a list of row indices to be saved to
+     the file. If rows is None (the default) all rows are saved.
+     Column names that are too long for a DBF file are replaced by the
+     names determined by _find_dbf_column_names.
+     """
+     dbf = dbflib.create(filename)
+     # Make sure the DBF file is closed even if writing fails part way
+     # through.
+     try:
+         # Mapping from Thuban field types to dbflib field types. It has
+         # its own name so that it doesn't hide the module level
+         # dbflib_fieldtypes which maps in the opposite direction.
+         thuban_to_dbflib = {FIELDTYPE_STRING: dbflib.FTString,
+                             FIELDTYPE_INT: dbflib.FTInteger,
+                             FIELDTYPE_DOUBLE: dbflib.FTDouble}
+         name_map = _find_dbf_column_names([col.name
+                                            for col in table.Columns()])
+         # Initialise the header. Columns that provide a prec attribute
+         # (presumably DBF columns) use it for doubles, all others fall
+         # back to 12 decimal places.
+         for col in table.Columns():
+             width = table.Width(col.name)
+             if col.type == FIELDTYPE_DOUBLE:
+                 prec = getattr(col, "prec", 12)
+             else:
+                 prec = 0
+             dbf.add_field(name_map[col.name], thuban_to_dbflib[col.type],
+                           width, prec)
+         if rows is None:
+             rows = range(table.NumRows())
+         # The records in the new file are numbered consecutively from 0
+         # regardless of which rows of the table were selected.
+         recNum = 0
+         for i in rows:
+             record = {}
+             for key, value in table.ReadRowAsDict(i).items():
+                 record[name_map[key]] = value
+             dbf.write_record(recNum, record)
+             recNum += 1
+     finally:
+         dbf.close()
+ def table_to_csv(table, filename, rows = None):
+     """Export table to csv file.
+     If rows is not None it must be a list of row indices to be saved to
+     the file. If rows is None (the default) all rows are saved.
+     The first line of the file is a header consisting of '#' followed
+     by the comma separated column names. The values are written with
+     '%s' formatting and are neither quoted nor escaped. Rows for which
+     the table returns an empty record are skipped. If the table has no
+     columns an empty file is created.
+     """
+     outfile = open(filename, "w")
+     # Make sure the file is closed even if reading the table fails.
+     try:
+         columns = table.Columns()
+         if columns:
+             names = [col.name for col in columns]
+             outfile.write("#" + ",".join(names) + "\n")
+             if rows is None:
+                 rows = range(table.NumRows())
+             for i in rows:
+                 record = table.ReadRowAsDict(i)
+                 # An empty record has no values to look up, so nothing
+                 # is written for it. Building and writing the line
+                 # inside this test avoids using a line that is
+                 # undefined or left over from the previous row.
+                 if record:
+                     values = ["%s" % record[name] for name in names]
+                     outfile.write(",".join(values) + "\n")
+     finally:
+         outfile.close()

 Legend:



Removed from v.994
 


changed lines


 
Added in v.1961
 Legend:



Removed from v.994
 


changed lines


 
Added in v.1961
-Removed from v.994
+Added in v.1961

[email protected]	ViewVC Help
Powered by ViewVC 1.1.26