1
0
mirror of https://github.com/djohnlewis/stackdump synced 2025-01-22 14:41:39 +00:00

Fixed a bug where uncommitted entries from a previously failed import were committed in a later, successful import.

This commit is contained in:
Samuel Lai 2012-08-12 16:31:30 +10:00
parent 1f29fd9113
commit 3944261eef
2 changed files with 23 additions and 1 deletions

View File

@ -588,7 +588,7 @@ dump_date = cmd_options.dump_date
readme_path = os.path.join(xml_root, 'readme.txt')
if not (site_name and dump_date) and os.path.exists(readme_path):
# get the site name from the first line of readme.txt. This could be fragile.
with open() as f:
with open(readme_path, 'r') as f:
site_readme_desc = f.readline().strip()
# assume if there's a colon in the name, the name part is before, and the date
@ -673,6 +673,17 @@ if site_key in ('search', 'import', 'media', 'licenses'):
print 'Use the --site-key parameter to specify an alternate site key.'
sys.exit(2)
# rollback any uncommitted entries in solr. Uncommitted entries may occur if
# this import process is aborted. Solr doesn't have the concept of transactions
# like databases do, so without a rollback, we'll be committing the previously
# uncommitted entries plus the newly imported ones.
#
# This also means multiple dataproc processes cannot occur concurrently. If you
# do the import will be silently incomplete.
print('Clearing any uncommitted entries in solr...')
solr._update('<rollback />', waitFlush=None, waitSearcher=None)
print('Cleared.\n')
# check if site is already in database; if so, purge the data.
site = list(Site.select(Site.q.key==site_key))
if len(site) > 0:

View File

@ -66,6 +66,17 @@ def delete_site(site_key):
sqlhub.threadConnection.commit(close=True)
# rollback any uncommitted entries in solr. Uncommitted entries may occur if
# the import process is aborted. Solr doesn't have the concept of
# transactions like databases do, so without a rollback, we'll be committing
# the previously uncommitted entries plus the newly imported ones.
#
# This also means multiple dataproc processes cannot occur concurrently. If
# you do the import will be silently incomplete.
print('Clearing any uncommitted entries in solr...')
solr._update('<rollback />', waitFlush=None, waitSearcher=None)
print('Cleared.\n')
if site_name:
print('Deleting site "%s" from solr... ' % site_name)
else: