[#6734] Add script for timing/profiling discussion-thread rendering Signed-off-by: Tim Van Steenburgh <tvansteenburgh@gmail.com>

commit: 8b0b86babc319188d58898f79e24e9bdc119deba [log] [tgz]
author: Tim Van Steenburgh <tvansteenburgh@gmail.com> Thu Oct 03 18:41:26 2013 +0000
committer: Tim Van Steenburgh <tvansteenburgh@gmail.com> Thu Oct 03 18:41:26 2013 +0000
tree: c015a5cc838761218b75251c658cf0544c2c7619
parent: c14b91aeed43ecdae266d5fcb7b826d3588d8a81 [diff]
diff --git a/Allura/allura/scripts/md_perf.py b/Allura/allura/scripts/md_perf.py
new file mode 100644
index 0000000..503c70d
--- /dev/null
+++ b/Allura/allura/scripts/md_perf.py

@@ -0,0 +1,113 @@
+"""
+A script for timing/profiling the Markdown conversion of an artifact discussion thread.
+
+Example usage:
+
+(env-allura)root@h1v1024:/var/local/allura/Allura(master)$ time paster script production.ini allura/scripts/md_perf.py -- --converter=forge
+      Conversion Time (s)  Text Size Post._id
+   1 0.021863937377929688         20 7d3ce86bb2c3afaee21f28547ed542d0c8c483b8
+   2 0.002238035202026367         12 96b1283c6db619cd66ee092551758dc1ad5b958f
+   3 0.001832962036132812          9 42c44cd72815d29069378353745bef953bdb2b98
+   4 0.011796951293945312        901 cadbea52291c58bb190597c1df94527369b405fa
+   5 0.143218040466308594      11018 362bee7ef1ba4e062712bda22cb96ae9fe459b95
+   6 0.029596090316772461       1481 46b78785b849f55d24cf32ee1f4e4c916cb7a6fe
+   7 0.045151948928833008       4144 4e2f62188080baba9b88c045ba1f7c26903bfcf9
+   8 0.637056827545166016      14553 51c87f2b1d55c08147bb2353e20361236232b432
+   9 4.510329008102416992      23016 f298ad88584f3dc9b5c37ffde61391bf03d5bae6
+  10 3.614714860916137695      23016 8775a230b19c231daa1608bb4cea1e17aab54550
+  11 0.393079042434692383      19386 ed79e0d2f89366043a007e0837e98945453508c9
+  12 0.000739097595214844      43659 56ac2437ec1bd886a03d23e45aa1c947729760ec
+  13 0.258469104766845703       8520 57152cefe0424b7fc9dff7ab4d21a6ef6e90bf82
+  14 0.264052867889404297       8518 6788b13c90c9719ba46196a0a773f4c228df9f2a
+  15 0.995774984359741211      14553 3f5cce06d2400bcd56d7b90d12c569935f0099a4
+Total time: 10.930670023
+
+real    0m14.256s
+user    0m12.749s
+sys     0m1.112s
+
+"""
+
+import argparse
+import cProfile
+import re
+import sys
+import time
+
+from mock import patch
+
+# re2 is an optional dependency: remember whether it could be imported so that
+# main() can ignore the --re2 option when it is unavailable.
+try:
+    import re2
+    # Ask re2 to report its fallbacks as warnings (presumably the cases where
+    # it hands a pattern back to the stdlib `re` module -- confirm against
+    # the re2 binding's documentation).
+    re2.set_fallback_notification(re2.FALLBACK_WARNING)
+    RE2_INSTALLED = True
+except ImportError:
+    RE2_INSTALLED = False
+
+from pylons import app_globals as g
+
+# Upper bound on how many characters of converted output render() prints
+# when --output is given.
+MAX_OUTPUT = 99999
+# When set to a non-empty string, render() converts this text instead of each
+# post's own text.
+DUMMYTEXT = None
+
+
+def get_artifact():
+    """Look up the blog post whose discussion thread is used as benchmark input.
+
+    The post is selected by a hard-coded slug and the result of the query is
+    returned unchanged.
+    """
+    from forgeblog import model as blog_model
+    slug = '2013/09/watch-breaking-bad-season-5-episode-16-felina-live-streaming'
+    return blog_model.BlogPost.query.get(slug=slug)
+
+
+def main(opts):
+    """Build the requested Markdown converter and render the benchmark thread.
+
+    :param opts: parsed command-line options. ``opts.re2`` and
+        ``opts.converter`` are read here; the whole object is passed on to
+        ``render``.
+    :returns: whatever ``render`` returns.
+    :raises KeyError: if ``opts.converter`` is not a known converter name.
+    """
+    import markdown
+    use_re2 = opts.re2 and RE2_INSTALLED
+    if opts.re2 and not use_re2:
+        # Don't fall back silently: a timing or --compare run would otherwise
+        # look like an re2 result while actually using re.
+        print >> sys.stderr, 'Warning: re2 is not installed; using re instead'
+    # Select the regex module explicitly on every call.  Only ever assigning
+    # re2 would leave the patch in place for later calls, so a second run with
+    # opts.re2 flipped off (as --compare does) would still be using re2.
+    markdown.inlinepatterns.re = re2 if use_re2 else re
+    converters = {
+        'markdown': lambda: markdown.Markdown(),
+        'markdown_safe': lambda: markdown.Markdown(safe_mode=True),
+        'markdown_escape': lambda: markdown.Markdown(safe_mode='escape'),
+        'forge': lambda: g.markdown,
+        }
+    # The converter is built after the regex module has been selected.
+    md = converters[opts.converter]()
+    artifact = get_artifact()
+    return render(artifact, md, opts)
+
+
+def render(artifact, md, opts):
+    """Convert the posts of ``artifact``'s discussion thread and print timings.
+
+    One line is printed per converted post with its 1-based position, the
+    conversion time in seconds, the length of the converted text and the
+    post's ``_id``; a total is printed at the end.
+
+    :param artifact: object exposing ``discussion_thread.posts``.
+    :param md: converter object; its ``convert(text)`` method is called once
+        per converted post.
+    :param opts: parsed options. ``opts.n`` (optional list of 1-based post
+        numbers to convert), ``opts.profile`` and ``opts.output`` are read.
+    :returns: the output of the last converted post, or ``None`` if no post
+        was converted (empty thread, or every post excluded by ``opts.n``).
+    """
+    begin = time.time()
+    # Bound up front so the final return cannot fail when nothing is converted.
+    output = None
+    print "%4s %20s %10s %s" % ('', 'Conversion Time (s)', 'Text Size', 'Post._id')
+    for i, p in enumerate(artifact.discussion_thread.posts):
+        post_num = i + 1
+        if opts.n and post_num not in opts.n:
+            print 'Skipping post %s' % post_num
+            continue
+        text = DUMMYTEXT or p.text
+        # Start the clock right before the conversion so that fetching posts
+        # and skipping earlier ones is not charged to this post.
+        start = time.time()
+        if opts.profile:
+            print 'Profiling post %s' % post_num
+            # runcall() hands back the return value of md.convert directly;
+            # exec'ing an assignment through cProfile.runctx() with locals()
+            # does not rebind this function's local variable.
+            profiler = cProfile.Profile()
+            output = profiler.runcall(md.convert, text)
+            profiler.print_stats()
+        else:
+            output = md.convert(text)
+        elapsed = time.time() - start
+        print "%4s %1.18f %10s %s" % (post_num, elapsed, len(text), p._id)
+        if opts.output:
+            print 'Input:', text[:300]
+            print 'Output:', output[:MAX_OUTPUT]
+    print "Total time:", time.time() - begin
+    return output
+
+
+def parse_options():
+    """Parse the script's command-line options from ``sys.argv``.
+
+    :returns: the ``argparse`` namespace with the attributes ``converter``,
+        ``profile``, ``output``, ``re2``, ``compare`` and ``n``.
+    """
+    parser = argparse.ArgumentParser(
+        description='Time or profile the Markdown conversion of a discussion thread')
+    # Restricting the choices makes argparse reject an unknown converter with
+    # a usage message instead of letting it surface later as a KeyError.
+    parser.add_argument('--converter', default='markdown',
+                        choices=('markdown', 'markdown_safe', 'markdown_escape', 'forge'),
+                        help='Markdown converter to use (default: %(default)s)')
+    parser.add_argument('--profile', action='store_true', help='Run profiler and output timings')
+    parser.add_argument('--output', action='store_true', help='Print result of markdown conversion')
+    parser.add_argument('--re2', action='store_true', help='Run with re2 instead of re')
+    parser.add_argument('--compare', action='store_true', help='Run with re and re2, and compare results')
+    parser.add_argument('-n', '--n', nargs='+', type=int, help='Only convert nth post(s) in thread')
+    return parser.parse_args()
+
+
+if __name__ == '__main__':
+    # Script entry point: run once with the options as given.
+    opts = parse_options()
+    first_output = main(opts)
+    if opts.compare:
+        # Run again with the re2 switch inverted and report whether the
+        # two runs returned the same output.
+        opts.re2 = not opts.re2
+        second_output = main(opts)
+        print 're/re2 outputs match: ', first_output == second_output
commit	8b0b86babc319188d58898f79e24e9bdc119deba	[log] [tgz]
author	Tim Van Steenburgh <tvansteenburgh@gmail.com>	Thu Oct 03 18:41:26 2013 +0000
committer	Tim Van Steenburgh <tvansteenburgh@gmail.com>	Thu Oct 03 18:41:26 2013 +0000
tree	c015a5cc838761218b75251c658cf0544c2c7619
parent	c14b91aeed43ecdae266d5fcb7b826d3588d8a81 [diff]