/[thuban]/branches/WIP-pyshapelib-bramz/Thuban/Model/transientdb.py
ViewVC logotype

Diff of /branches/WIP-pyshapelib-bramz/Thuban/Model/transientdb.py

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 818 by bh, Mon May 5 17:18:31 2003 UTC revision 1511 by bh, Tue Jul 29 14:48:57 2003 UTC
# Line 18  __version__ = "$Revision$" Line 18  __version__ = "$Revision$"
18  # $Source$  # $Source$
19  # $Id$  # $Id$
20    
 import os  
 import weakref  
21  from sqlite import connect  from sqlite import connect
22    
23    from base import TitledObject
24    
25  import table  import table
26    
27  sql_type_map = {  sql_type_map = {
# Line 118  class TransientTableBase(table.OldTableI Line 118  class TransientTableBase(table.OldTableI
118    
119          # Build the CREATE TABLE statement and create the table in the          # Build the CREATE TABLE statement and create the table in the
120          # database          # database
121          table_types = []          table_types = ["id INTEGER PRIMARY KEY"]
122          for col in self.columns:          for col in self.columns:
123              table_types.append("%s %s" % (col.internal_name,              table_types.append("%s %s" % (col.internal_name,
124                                            sql_type_map[col.type]))                                            sql_type_map[col.type]))
# Line 155  class TransientTableBase(table.OldTableI Line 155  class TransientTableBase(table.OldTableI
155      def Column(self, col):      def Column(self, col):
156          return self.column_map[col]          return self.column_map[col]
157    
158        def HasColumn(self, col):
159            """Return whether the table has a column with the given name or index
160            """
161            return self.column_map.has_key(col)
162    
163      def ReadRowAsDict(self, index):      def ReadRowAsDict(self, index):
164            # Implementation Strategy: Executing a completely new select
165            # statement every time this method is called is too slow. The
166            # most important usage is to read the records more or less
167            # sequentially. This happens e.g. when drawing a layer with a
168            # classification where the shapes are drawn in order of the
169            # shape ids. Another pattern is that the same row is requested
170            # several times in a row. This happens in the table view, for
171            # instance.
172    
173            # We can exploit this to make access faster by having one cursor
174            # open all the time and keeping the last row read around in case
175            # the same row is accessed again the next time and if the row
176            # index is larger than the row we have read last we simply fetch
177            # rows from the cursor until we've reached the requested row. If
178            # the requested row index is smaller then we start a new cursor.
179    
180            # FIXME: So far this scheme seems to work well enough. Obvious
181            # improvements would be to start the cursor at exactly the
182            # requested row (should be efficient and easy to do now that the
183            # id is the primary key) and to perhaps to also start a new
184            # cursor if the requested index is much larger than the last row
185            # so that we don't read and discard lots of the rows.
186    
187            # Check whether we have to start a new cursor
188          if self.read_record_cursor is None or index <self.read_record_last_row:          if self.read_record_cursor is None or index <self.read_record_last_row:
189              stmt = ("SELECT %s FROM %s;"              stmt = ("SELECT %s FROM %s;"
190                      % (", ".join([c.internal_name for c in self.columns]),                      % (", ".join([c.internal_name for c in self.columns]),
# Line 179  class TransientTableBase(table.OldTableI Line 208  class TransientTableBase(table.OldTableI
208          self.read_record_last_row = index          self.read_record_last_row = index
209          return dict(zip(self.orig_names, result))          return dict(zip(self.orig_names, result))
210    
211        def ReadValue(self, row, col):
212            """Return the value of the specified row and column
213    
214            The col parameter may be the index of the column or its name.
215            """
216            # Depending on the actual access patterns of the table data, it
217            # might be a bit faster in some circumstances to not implement
218            # this via ReadRowAsDict, but this simple implementation should
219            # be fast enough for most purposes.
220            return self.ReadRowAsDict(row)[self.column_map[col].name]
221    
222      def ValueRange(self, col):      def ValueRange(self, col):
223          col = self.column_map[col]          col = self.column_map[col]
224          iname = col.internal_name          iname = col.internal_name
# Line 200  class TransientTableBase(table.OldTableI Line 240  class TransientTableBase(table.OldTableI
240              result.append(row[0])              result.append(row[0])
241          return result          return result
242    
243        def Width(self, col):
244            """Return the maximum width of values in the column
245    
246            The return value is the the maximum length of string
247            representation of the values in the column (represented by index
248            or name).
249            """
250            max = 0
251    
252            type  = self.column_map[col].type
253            iname = self.column_map[col].internal_name
254            cursor = self.db.cursor()
255            cursor.execute("SELECT %s FROM %s;" % (iname, self.tablename))
256            values = [ i[0] for i in cursor.fetchall()]
257            if not values:
258                return None
259    
260            if type == table.FIELDTYPE_DOUBLE:
261                format = "%.12f"
262            elif type == table.FIELDTYPE_INT:
263                format = "%d"
264            else:
265                format = "%s"
266            for value in values:
267                if value is None: continue
268                l = len(format % value)
269                if l > max:
270                    max = l
271    
272            return max
273    
274        def SimpleQuery(self, left, comparison, right):
275            """Return the indices of all rows that matching a condition.
276    
277            Parameters:
278               left -- The column object for the left side of the comparison
279    
280               comparison -- The comparison operator as a string. It must be
281                             one of '==', '!=', '<', '<=', '>=', '>'
282    
283               right -- The right hand side of the comparison. It must be
284                        either a column object or a value, i.e. a string,
285                        int or float.
286    
287            The return value is a sorted list of the indices of the rows
288            where the condition is true.
289            """
290            if comparison not in ("==", "!=", "<", "<=", ">=", ">"):
291                raise ValueError("Comparison operator %r not allowed" % comparison)
292    
293            if hasattr(right, "internal_name"):
294                right_template = right.internal_name
295                params = ()
296            else:
297                right_template = "%s"
298                params = (right,)
299    
300            query = "SELECT id FROM %s WHERE %s %s %s ORDER BY id;" \
301                    % (self.tablename, left.internal_name, comparison,
302                       right_template)
303    
304            cursor = self.db.cursor()
305            cursor.execute(query, params)
306            result = []
307            while 1:
308                row = cursor.fetchone()
309                if row is None:
310                    break
311                result.append(row[0])
312            return result
313    
314        def Dependencies(self):
315            """Placeholder for a method in a derived class.
316    
317            Return a sequence with the tables and other data objects that
318            self depends on.
319            """
320            raise NotImplementedError
321    
322    
323  class TransientTable(TransientTableBase):  class TransientTable(TitledObject, TransientTableBase):
324    
325      """A Table in a transient DB that starts as the copy of a Thuban Table."""      """A Table in a transient DB that starts as the copy of a Thuban Table."""
326    
# Line 212  class TransientTable(TransientTableBase) Line 331  class TransientTable(TransientTableBase)
331          interface.          interface.
332          """          """
333          TransientTableBase.__init__(self, transient_db)          TransientTableBase.__init__(self, transient_db)
334            TitledObject.__init__(self, table.Title())
335          self.create(table)          self.create(table)
336    
337      def create(self, table):      def create(self, table):
# Line 222  class TransientTable(TransientTableBase) Line 342  class TransientTable(TransientTableBase)
342          TransientTableBase.create(self, columns)          TransientTableBase.create(self, columns)
343    
344          # copy the input table to the transient db          # copy the input table to the transient db
345          insert_template = "INSERT INTO %s (%s) VALUES (%s);" \  
346            # A key to insert to use for the formatting of the insert
347            # statement. The key must not be equal to any of the column
348            # names so we construct one by building a string of x's that is
349            # longer than any of the column names
350            id_key = max([len(col.name) for col in self.columns]) * "x"
351    
352            insert_template = "INSERT INTO %s (id, %s) VALUES (%%(%s)s, %s);" \
353                                 % (self.tablename,                                 % (self.tablename,
354                                    ", ".join([col.internal_name                                    ", ".join([col.internal_name
355                                               for col in self.columns]),                                               for col in self.columns]),
356                                      id_key,
357                                    ", ".join(["%%(%s)s" % col.name                                    ", ".join(["%%(%s)s" % col.name
358                                               for col in self.columns]))                                               for col in self.columns]))
359          cursor = self.db.cursor()          cursor = self.db.cursor()
360          for i in range(table.NumRows()):          for i in range(table.NumRows()):
361              cursor.execute(insert_template, table.ReadRowAsDict(i))              row = table.ReadRowAsDict(i)
362                row[id_key] = i
363                cursor.execute(insert_template, row)
364          self.db.conn.commit()          self.db.conn.commit()
365    
366    
367    
368  class TransientJoinedTable(TransientTableBase):  class TransientJoinedTable(TitledObject, TransientTableBase):
369    
370      """A Table in the transient DB that contains a join of two tables"""      """A Table in the transient DB that contains a join of two tables"""
371    
372      def __init__(self, transient_db, left_table, left_field,      def __init__(self, transient_db, left_table, left_field,
373                   right_table, right_field = None):                   right_table, right_field = None, outer_join = False):
374          """Create a new table in the transient DB as a join of two tables.          """Create a new table in the transient DB as a join of two tables.
375    
376          Both input tables, left_table and right_table must have a          Both input tables, left_table and right_table must have a
377          transient_table method that returns a table object for a table          transient_table method that returns a table object for a table
378          in the trnsient database. The join is performed on the condition          in the transient database. The join is performed on the condition
379          that the value of the left_field column the the left table is          that the value of the left_field column the the left table is
380          equal to the value of the right_field in the right_table.          equal to the value of the right_field in the right_table.
381    
382          The joined table contains all columns of the input tables with          The joined table contains all columns of the input tables,
383          one exception: Any column in the right_table with the same name          however, the column names of the right table may be changed
384          as one of the columns in the left_table will be omitted. This is          slightly to make them unique in the joined table. This is
385          somewhat of an implementation detail, but is done so that the          currently done by appending a sufficient number of underscores
386          column names of the joined table can be the same as the column          ('_').
         names of the input tables without having to create prefixes.  
387          """          """
388          TransientTableBase.__init__(self, transient_db)          TransientTableBase.__init__(self, transient_db)
389            self.dependencies = (left_table, right_table)
390          self.left_table = left_table.transient_table()          self.left_table = left_table.transient_table()
391          self.left_field = left_field          self.left_field = left_field
392          self.right_table = right_table.transient_table()          self.right_table = right_table.transient_table()
# Line 264  class TransientJoinedTable(TransientTabl Line 394  class TransientJoinedTable(TransientTabl
394              self.right_field = right_field              self.right_field = right_field
395          else:          else:
396              self.right_field = self.left_field              self.right_field = self.left_field
397            self.outer_join = outer_join
398    
399            title = "Join of %(left)s and %(right)s" \
400                    % {"left": self.left_table.Title(),
401                       "right": self.right_table.Title()}
402            TitledObject.__init__(self, title)
403    
404          self.create()          self.create()
405    
406      def create(self):      def create(self):
# Line 272  class TransientJoinedTable(TransientTabl Line 409  class TransientJoinedTable(TransientTabl
409    
410          self.right_table.ensure_index(self.right_field)          self.right_table.ensure_index(self.right_field)
411    
412            # determine the internal column names to join on before
413            # coalescing the column information because if the external
414            # column names are the same they will be mapped to the same
415            # internal name afterwards.
416            internal_left_col = self.left_table.orig_to_internal[self.left_field]
417            internal_right_col =self.right_table.orig_to_internal[self.right_field]
418    
419          # Coalesce the column information          # Coalesce the column information
420          visited = {}          visited = {}
421          columns = []          columns = []
422          for col in self.left_table.columns + self.right_table.columns:          newcolumns = []
423              if col.name in visited:          for table in (self.left_table, self.right_table):
424                  continue              for col in table.Columns():
425              columns.append(col)                  colname = col.name
426          TransientTableBase.create(self, columns)                  # We can't allow multiple columns with the same
427                    # original name, so append '_' to this one until
428                    # it is unique.
429                    # FIXME: There should be a better solution.
430                    while colname in visited:
431                        colname = colname + '_'
432                    columns.append((table.tablename, col))
433                    newcol = ColumnReference(colname, col.type,
434                                                "Col%03d" % (len(newcolumns)+1))
435                    newcolumns.append(newcol)
436                    visited[colname] = 1
437            TransientTableBase.create(self, newcolumns)
438    
439          # Copy the joined data to the table.          # Copy the joined data to the table.
440          internal_names = [col.internal_name for col in self.columns]          newinternal_names = [col.internal_name for col in self.columns]
441          stmt = "INSERT INTO %s (%s) SELECT %s FROM %s JOIN %s ON %s = %s;" \          internal_references = ["%s.%s" % (table, col.internal_name)
442                 % (self.tablename,                                                      for table, col in columns]
443                    ", ".join(internal_names),          if self.outer_join:
444                    ", ".join(internal_names),              join_operator = 'LEFT OUTER JOIN'
445                    self.left_table.tablename,          else:
446                    self.right_table.tablename,              join_operator = 'JOIN'
447                    self.orig_to_internal[self.left_field],          stmt = ("INSERT INTO %s (id, %s) SELECT %s.id, %s FROM %s"
448                    self.orig_to_internal[self.right_field])                  " %s %s ON %s.%s = %s.%s;"
449                    % (self.tablename,
450                       ", ".join(newinternal_names),
451                       self.left_table.tablename,
452                       ", ".join(internal_references),
453                       self.left_table.tablename,
454                       join_operator,
455                       self.right_table.tablename,
456                       self.left_table.tablename,
457                       internal_left_col,
458                       self.right_table.tablename,
459                       internal_right_col))
460          self.db.execute(stmt)          self.db.execute(stmt)
461    
462        def Dependencies(self):
463            """Return a tuple with the two tables the join depends on."""
464            return self.dependencies
465    
466        def JoinType(self):
467            """Return the type of the join (either 'INNER' or 'LEFT OUTER')"""
468            if self.outer_join:
469                return "LEFT OUTER"
470            else:
471                return "INNER"
472    
473    
474  class AutoTransientTable(table.OldTableInterfaceMixin):  class AutoTransientTable(TitledObject, table.OldTableInterfaceMixin):
475    
476      """Table that copies data to a transient table on demand.      """Table that copies data to a transient table on demand.
477    
# Line 303  class AutoTransientTable(table.OldTableI Line 480  class AutoTransientTable(table.OldTableI
480      """      """
481    
482      def __init__(self, transient_db, table):      def __init__(self, transient_db, table):
483            TitledObject.__init__(self, table.Title())
484          self.transient_db = transient_db          self.transient_db = transient_db
485          self.table = table          self.table = table
486          self.t_table = None          self.t_table = None
# Line 313  class AutoTransientTable(table.OldTableI Line 491  class AutoTransientTable(table.OldTableI
491      def Column(self, col):      def Column(self, col):
492          return self.table.Column(col)          return self.table.Column(col)
493    
494        def HasColumn(self, col):
495            """Return whether the table has a column with the given name or index
496            """
497            return self.table.HasColumn(col)
498    
499      def NumRows(self):      def NumRows(self):
500          return self.table.NumRows()          return self.table.NumRows()
501    
# Line 323  class AutoTransientTable(table.OldTableI Line 506  class AutoTransientTable(table.OldTableI
506          """Return the record no. record as a dict mapping field names to values          """Return the record no. record as a dict mapping field names to values
507          """          """
508          if self.t_table is not None:          if self.t_table is not None:
509              return self.t_table.read_record(record)              return self.t_table.ReadRowAsDict(record)
510          else:          else:
511              return self.table.ReadRowAsDict(record)              return self.table.ReadRowAsDict(record)
512    
513        def ReadValue(self, row, col):
514            """Return the value of the specified row and column
515    
516            The col parameter may be the index of the column or its name.
517            """
518            if self.t_table is not None:
519                return self.t_table.ReadValue(row, col)
520            else:
521                return self.table.ReadValue(row, col)
522    
523      def copy_to_transient(self):      def copy_to_transient(self):
524          """Internal: Create a transient table and copy the data into it"""          """Internal: Create a transient table and copy the data into it"""
525          self.t_table = TransientTable(self.transient_db, self)          self.t_table = TransientTable(self.transient_db, self)
# Line 342  class AutoTransientTable(table.OldTableI Line 535  class AutoTransientTable(table.OldTableI
535      def ValueRange(self, col):      def ValueRange(self, col):
536          if self.t_table is None:          if self.t_table is None:
537              self.copy_to_transient()              self.copy_to_transient()
538          (min, row), (max, row) = self.t_table.field_range(col)          return self.t_table.ValueRange(col)
         return min, max  
539    
540      def UniqueValues(self, colname):      def UniqueValues(self, col):
541          if self.t_table is None:          if self.t_table is None:
542              self.copy_to_transient()              self.copy_to_transient()
543          return self.t_table.GetUniqueValues(colname)          return self.t_table.UniqueValues(col)
544    
545        def SimpleQuery(self, left, comparison, right):
546            if self.t_table is None:
547                self.copy_to_transient()
548            # Make sure to use the column object of the transient table. The
549            # left argument is always a column object so we can just ask the
550            # t_table for the right object.
551            if hasattr(right, "name"):
552                return self.t_table.SimpleQuery(self.t_table.Column(left.name),
553                                                comparison,
554                                                self.t_table.Column(right.name))
555            else:
556                return self.t_table.SimpleQuery(self.t_table.Column(left.name),
557                                                comparison, right)
558    
559        def Dependencies(self):
560            """Return a tuple containing the original table"""
561            return (self.table,)
562    
563        def Width(self, col):
564            return self.table.Width(col)

Legend:
Removed from v.818  
changed lines
  Added in v.1511

[email protected]
ViewVC Help
Powered by ViewVC 1.1.26