added progress bars to the SE importer and improved progress bar printing

author: Evgeny Fadeev <evgeny.fadeev@gmail.com> 2012-11-14 21:02:02 -0300
committer: Evgeny Fadeev <evgeny.fadeev@gmail.com> 2012-11-14 21:02:02 -0300
commit: 8728a90c5b342d16bfa93dc4f2d2e3c75aece0e8 (patch)
tree: 5de0114ccfe3cc1983985b1aeb40736e1f473630
parent: 58a3f9d367b2d0a95624bc31e865863e8da02714 (diff)
download: askbot-8728a90c5b342d16bfa93dc4f2d2e3c75aece0e8.tar.gz
askbot-8728a90c5b342d16bfa93dc4f2d2e3c75aece0e8.tar.bz2
askbot-8728a90c5b342d16bfa93dc4f2d2e3c75aece0e8.zip
2 files changed, 57 insertions, 28 deletions
diff --git a/askbot/importers/stackexchange/management/commands/load_stackexchange.py b/askbot/importers/stackexchange/management/commands/load_stackexchange.py
index 313bab13..a021b62d 100644
--- a/askbot/importers/stackexchange/management/commands/load_stackexchange.py
+++ b/askbot/importers/stackexchange/management/commands/load_stackexchange.py
@@ -1,5 +1,5 @@
 #todo: http://stackoverflow.com/questions/837828/how-to-use-a-slug-in-django 
-DEBUGME = False 
+DEBUGME = False
 import os
 import re
 import sys
@@ -38,7 +38,8 @@ if DEBUGME == True:
     from askbot.utils import dummy_transaction as transaction
     HEAP = hpy()
 else:
-    from django.db import transaction
+    #from django.db import transaction
+    from askbot.utils import dummy_transaction as transaction
 
 xml_read_order = (
         'VoteTypes','UserTypes','Users','Users2Votes',
@@ -315,7 +316,8 @@ it may be helpful to split this procedure in two:\n
 
         if django_settings.DEBUG:
             raise CommandError(
-                'Please set DEBUG to False in the settings.py to reduce RAM usage'
+                'Please set DEBUG to False in the settings.py to reduce '
+                'RAM usage during the import process'
             )
 
         #process the command line arguments, if given
@@ -368,36 +370,36 @@ it may be helpful to split this procedure in two:\n
         self.save_askbot_message_id_list()
 
         #transfer data into ASKBOT tables
-        print 'Transferring users...',
+        print 'Transferring users...'
         self.transfer_users()
         transaction.commit()
         print 'done.'
-        print 'Transferring content edits...',
+        print 'Transferring content edits...'
         sys.stdout.flush()
         self.transfer_question_and_answer_activity()
         transaction.commit()
         print 'done.'
-        print 'Transferring view counts...',
+        print 'Transferring view counts...'
         sys.stdout.flush()
         self.transfer_question_view_counts()
         transaction.commit()
         print 'done.'
-        print 'Transferring comments...',
+        print 'Transferring comments...'
         sys.stdout.flush()
         self.transfer_comments()
         transaction.commit()
         print 'done.'
-        print 'Transferring badges and badge awards...',
+        print 'Transferring badges and badge awards...'
         sys.stdout.flush()
         self.transfer_badges()
         transaction.commit()
         print 'done.'
-        print 'Transferring Q&A votes...',
+        print 'Transferring Q&A votes...'
         sys.stdout.flush()
         self.transfer_QA_votes()#includes favorites, accepts and flags
         transaction.commit()
         print 'done.'
-        print 'Transferring comment votes...',
+        print 'Transferring comment votes...'
         sys.stdout.flush()
         self.transfer_comment_votes()
         transaction.commit()
@@ -444,7 +446,8 @@ it may be helpful to split this procedure in two:\n
         """transfers some messages from
         SE to ASKBOT
         """
-        for m in se.Message.objects.all().iterator():
+        messages = se.Message.objects.all()
+        for m in ProgressBar(messages.iterator(), messages.count()):
             if m.is_read:
                 continue
             if m.user is None:
@@ -707,7 +710,8 @@ it may be helpful to split this procedure in two:\n
             self._process_post_revision_group(c_group)
 
     def transfer_comments(self):
-        for se_c in se.PostComment.objects.all().iterator():
+        comments = se.PostComment.objects.all()
+        for se_c in ProgressBar(comments.iterator(), comments.count()):
             if se_c.deletion_date:
                 print 'Warning deleted comment %d dropped' % se_c.id
                 sys.stdout.flush()
@@ -730,7 +734,9 @@ it may be helpful to split this procedure in two:\n
 
     def _collect_missing_badges(self):
         self._missing_badges = {}
-        for se_b in se.Badge.objects.all():
+        badges = se.Badge.objects.all()
+        message = 'Collecting missing badges'
+        for se_b in ProgressBar(badges.iterator(), badges.count(), message):
             name = X.get_badge_name(se_b.name)
             try:
                 #todo: query badge from askbot.models.badges
@@ -747,7 +753,9 @@ it may be helpful to split this procedure in two:\n
     def _award_badges(self):
         #note: SE does not keep information on
         #content-related badges like askbot does
-        for se_a in se.User2Badge.objects.all().iterator():
+        badges = se.User2Badge.objects.all()
+        message = 'Awarding badges'
+        for se_a in ProgressBar(badges.iterator(), badges.count(), message):
             if se_a.user.id == -1:
                 continue #skip community user
             u = USER[se_a.user.id]
@@ -790,7 +798,8 @@ it may be helpful to split this procedure in two:\n
         pass
 
     def transfer_question_view_counts(self):
-        for se_q in se.Post.objects.filter(post_type__name='Question').iterator():
+        questions = se.Post.objects.filter(post_type__name='Question')
+        for se_q in ProgressBar(questions.iterator(), questions.count()):
             q = X.get_post(se_q)
             if q is None:
                 continue
@@ -799,7 +808,8 @@ it may be helpful to split this procedure in two:\n
 
 
     def transfer_QA_votes(self):
-        for v in se.Post2Vote.objects.all().iterator():
+        votes = se.Post2Vote.objects.all()
+        for v in ProgressBar(votes.iterator(), votes.count()):
             vote_type = v.vote_type.name
             if not vote_type in X.vote_actions:
                 continue
@@ -826,7 +836,8 @@ it may be helpful to split this procedure in two:\n
             transaction.commit()
 
     def transfer_comment_votes(self):
-        for v in se.Comment2Vote.objects.all().iterator():
+        votes = se.Comment2Vote.objects.all()
+        for v in ProgressBar(votes.iterator(), votes.count()):
             vote_type = v.vote_type.name
             if vote_type not in ('UpMod', 'Offensive'):
                 continue
@@ -869,10 +880,11 @@ it may be helpful to split this procedure in two:\n
         xml_data = self.zipfile.read(xml_path)
 
         tree = et.fromstring(xml_data)
-        print 'loading from %s to %s' % (xml_path, table_name) ,
+        print 'loading from %s to %s' % (xml_path, table_name)
         model = models.get_model('stackexchange', table_name)
         i = 0
-        for row in tree.findall('.//row'):
+        rows = tree.findall('.//row')
+        for row in ProgressBar(iter(rows), len(rows)):
             model_entry = model()
             i += 1
             for col in row.getchildren():
@@ -897,8 +909,7 @@ it may be helpful to split this procedure in two:\n
 
     def transfer_users(self):
         se_users = se.User.objects.all()
-        count = se_users.count()
-        for se_u in ProgressBar(se_users.iterator(), count):
+        for se_u in ProgressBar(se_users.iterator(), se_users.count()):
             #if se_u.id == -1:#skip the Community user
             #    continue
             u = askbot.User()
diff --git a/askbot/utils/console.py b/askbot/utils/console.py
index a691d961..0c27cd23 100644
--- a/askbot/utils/console.py
+++ b/askbot/utils/console.py
@@ -91,7 +91,8 @@ class ProgressBar(object):
         self.iterable = iterable
         self.length = length
         self.counter = float(0)
-        self.barlen = 60
+        self.max_barlen = 60
+        self.curr_barlen = 0
         self.progress = ''
         if message and length > 0:
             print message
@@ -103,17 +104,33 @@ class ProgressBar(object):
     def print_progress_bar(self):
         """prints the progress bar"""
 
-        sys.stdout.write('\b'*len(self.progress))
+        self.backspace_progress_percent()
+
+        tics_to_write = 0
+        if self.length < self.max_barlen:
+            tics_to_write = self.max_barlen/self.length
+        elif int(self.counter) % (self.length/self.max_barlen) == 0:
+            tics_to_write = 1
+
+        if self.curr_barlen + tics_to_write <= self.max_barlen:
+            sys.stdout.write('-' * tics_to_write)
+            self.curr_barlen += tics_to_write
 
-        if self.length < self.barlen:
-            sys.stdout.write('-'*(self.barlen/self.length))
-        elif int(self.counter) % (self.length / self.barlen) == 0:
-            sys.stdout.write('-')
+        self.print_progress_percent()
+
+    def backspace_progress_percent(self):
+        sys.stdout.write('\b'*len(self.progress))
 
+    def print_progress_percent(self):
+        """prints percent of achieved progress"""
         self.progress = ' %.2f%%' % (100 * (self.counter/self.length))
         sys.stdout.write(self.progress)
         sys.stdout.flush()
 
+    def finish_progress_bar(self):
+        """brint the last bars, to make all bars equal length"""
+        self.backspace_progress_percent()
+        sys.stdout.write('-' * (self.max_barlen - self.curr_barlen))
 
     def next(self):
 
@@ -121,7 +138,8 @@ class ProgressBar(object):
             result = self.iterable.next()
         except StopIteration:
             if self.length > 0:
-                self.print_progress_bar()
+                self.finish_progress_bar()
+                self.print_progress_percent()
                 sys.stdout.write('\n')
             raise
author	Evgeny Fadeev <evgeny.fadeev@gmail.com>	2012-11-14 21:02:02 -0300
committer	Evgeny Fadeev <evgeny.fadeev@gmail.com>	2012-11-14 21:02:02 -0300
commit	8728a90c5b342d16bfa93dc4f2d2e3c75aece0e8 (patch)
tree	5de0114ccfe3cc1983985b1aeb40736e1f473630
parent	58a3f9d367b2d0a95624bc31e865863e8da02714 (diff)
download	askbot-8728a90c5b342d16bfa93dc4f2d2e3c75aece0e8.tar.gz askbot-8728a90c5b342d16bfa93dc4f2d2e3c75aece0e8.tar.bz2 askbot-8728a90c5b342d16bfa93dc4f2d2e3c75aece0e8.zip