tablediff.py
author Radek Brich <radek.brich@devl.cz>
Thu, 31 May 2012 11:28:41 +0200
changeset 38 d3593869d624
parent 35 e7f79c4a27ce
child 41 6aad5e35efe8
permissions -rwxr-xr-x
Update bigtables tool: scan all schemas.

#!/usr/bin/env python3.2
#
# Print differencies between data in two tables of same schema.
#
# Requirements:
#  * First column of both tables must be numerical primary key.
#  * Destination table must contain all columns from source table.
#    Order is not important.
#

from pgtoolkit import toolbase, pgmanager, pgdatadiff
from pgtoolkit.highlight import *


class TableDiffTool(toolbase.SrcDstTablesTool):
    def __init__(self):
        toolbase.SrcDstTablesTool.__init__(self, name='tablediff', desc='Table diff.')
        
        self.parser.add_argument('--sql', action='store_true', help='Output is SQL script.')
        self.parser.add_argument('--rowcount', action='store_true', help='Compare number of rows.')
        
        self.init()

    def main(self):
        srcconn = self.pgm.get_conn('src')
        dstconn = self.pgm.get_conn('dst')
        
        dd = pgdatadiff.PgDataDiff(srcconn, dstconn)
        
        for srcschema, srctable, dstschema, dsttable in self.tables():
            print('-- Diff from [%s] %s.%s to [%s] %s.%s' % (
                self.args.src, srcschema, srctable,
                self.args.dst, dstschema, dsttable))
            
            if self.args.rowcount:
                with self.pgm.cursor('src') as curs:
                    curs.execute('''SELECT count(*) FROM "%s"."%s"''' % (srcschema, srctable))
                    srccount = curs.fetchone()[0]
                with self.pgm.cursor('dst') as curs:
                    curs.execute('''SELECT count(*) FROM "%s"."%s"''' % (dstschema, dsttable))
                    dstcount = curs.fetchone()[0]
                if srccount != dstcount:
                    print(highlight(1, BOLD | YELLOW), "Row count differs: src=%s dst=%s" % (srccount, dstcount), highlight(0), sep='')
                continue
            
            dd.settable1(srctable, srcschema)
            dd.settable2(dsttable, dstschema)
            
            if self.args.sql:
                dd.print_patch()
            else:
                dd.print_diff()


tool = TableDiffTool()
tool.main()