# encoding: utf8
import sys
+from sqlalchemy.exc import IntegrityError
import sqlalchemy.types
from .db import connect, metadata, tables as tables_module
from sqlalchemy.orm.attributes import instrumentation_registry
- session = connect(engine_uri)
+ # Use autocommit in case rows fail due to foreign key incest
+ session = connect(engine_uri, autocommit=True, autoflush=False)
metadata.create_all()
# Print the table name but leave the cursor in a fixed column
print table_name + '...', ' ' * (40 - len(table_name)),
+ sys.stdout.flush()
try:
csvfile = open("%s/%s.csv" % (directory, table_name), 'rb')
reader = csv.reader(csvfile, lineterminator='\n')
column_names = [unicode(column) for column in reader.next()]
+ # Self-referential tables may contain rows with foreign keys of
+ # other rows in the same table that do not yet exist. We'll keep
+ # a running list of these and try inserting them again after the
+ # rest are done
+ failed_rows = []
+
for csvs in reader:
row = table_class()
setattr(row, column_name, value)
- session.add(row)
-
- session.commit()
- print 'loaded'
-
+ try:
+ session.add(row)
+ session.flush()
+ except IntegrityError as e:
+ failed_rows.append(row)
+
+ # Loop over the failed rows and keep trying to insert them. If a loop
+ # doesn't manage to insert any rows, bail.
+ do_another_loop = True
+ while failed_rows and do_another_loop:
+ do_another_loop = False
+
+ for i, row in enumerate(failed_rows):
+ try:
+ session.add(row)
+ session.flush()
+
+ # Success!
+ del failed_rows[i]
+ do_another_loop = True
+ except IntegrityError as e:
+ pass
+
+ if failed_rows:
+ print len(failed_rows), "rows failed"
+ else:
+ print 'loaded'
def csvexport(engine_uri, directory='.'):
import csv