import sys
from collections import defaultdict
from itertools import groupby

from pylons import c, g
from pymongo.errors import DuplicateKeyError
from ming.orm import mapper, session, Mapper
from ming.orm.declarative import MappedClass

import allura.tasks.index_tasks
from allura.lib.exceptions import CompoundError
from allura.lib import utils
from . import base

class ShowModelsCommand(base.Command):
    min_args=1
    max_args=1
    usage = '<ini file>'
    summary = 'Show the inheritance graph of all Ming models'
    parser = base.Command.standard_parser(verbose=True)

    def command(self):
        self.basic_setup()
        graph = build_model_inheritance_graph()
        for depth, cls in dfs(MappedClass, graph):
            for line in dump_cls(depth, cls):
                print line

class ReindexCommand(base.Command):
    min_args=1
    max_args=1
    usage = '<ini file>'
    summary = 'Reindex and re-shortlink all artifacts'
    parser = base.Command.standard_parser(verbose=True)
    parser.add_option('-p', '--project', dest='project', default=None,
                      help='project to reindex')
    parser.add_option('--mount_point', dest='mount_point', default=None,
                      help='limit to this mount point (only use with --solr)')
    parser.add_option('-n', '--neighborhood', dest='neighborhood', default=None,
                      help='neighborhood to reindex (e.g. p)')
    parser.add_option('--solr', action='store_true', dest='solr',
                      help='Solr needs artifact references to already exist.')
    parser.add_option('--refs', action='store_true', dest='refs',
                      help='Update artifact references and shortlinks')

    def command(self):
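        '''Rebuild artifact references/shortlinks and/or the Solr index for the
        selected projects, according to the --refs and --solr options.'''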
        from allura import model as M
        self.basic_setup()
        graph = build_model_inheritance_graph()
        if self.options.project:
            q_project = dict(shortname=self.options.project)
        elif self.options.neighborhood:
            neighborhood_id = M.Neighborhood.query.get(
                url_prefix='/%s/' % self.options.neighborhood)._id
            q_project = dict(neighborhood_id=neighborhood_id)
        else:
            q_project = {}

        # if none specified, do all
        if not self.options.solr and not self.options.refs:
            self.options.solr = self.options.refs = True
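        # Walk projects in chunks so the whole project collection is never
        # loaded into memory at once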
        for projects in utils.chunked_find(M.Project, q_project):
            for p in projects:
                c.project = p
                base.log.info('Reindex project %s', p.shortname)
                # Clear index for this project
                if self.options.solr:
                    g.solr.delete(q='project_id_s:%s' % p._id)
                if self.options.refs:
                    M.ArtifactReference.query.remove({'artifact_reference.project_id':p._id})
                    M.Shortlink.query.remove({'project_id':p._id})
                app_config_ids = [ac._id for ac in p.app_configs
                                  if not self.options.mount_point
                                  or self.options.mount_point == ac.options.mount_point]
                # Traverse the inheritance graph, finding all artifacts that
                # belong to this project
                for _, a_cls in dfs(M.Artifact, graph):
                    base.log.info(' %s', a_cls)
                    ref_ids = []
                    # Create artifact references and shortlinks
                    for a in a_cls.query.find(dict(app_config_id={'$in': app_config_ids})):
                        if self.options.verbose:
                            base.log.info(' %s', a.shorthand_id())
                        if self.options.refs:
                            try:
                                M.ArtifactReference.from_artifact(a)
                                M.Shortlink.from_artifact(a)
                            except:
                                base.log.exception('Making ArtifactReference/Shortlink from %s', a)
                                continue
                        ref_ids.append(a.index_id())
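                    # Flush the new refs/shortlinks to mongo and clear cached
                    # artifacts before indexing this batch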
                    M.main_orm_session.flush()
                    M.artifact_orm_session.clear()
                    try:
                        if self.options.verbose:
                            base.log.info('adding artifacts: %s' % ref_ids)
                        allura.tasks.index_tasks.add_artifacts(ref_ids,
                                update_solr=self.options.solr,
                                update_refs=self.options.refs,
                                verbose=self.options.verbose)
                    except CompoundError, err:
                        base.log.exception('Error indexing artifacts:\n%r', err)
                        base.log.error('%s', err.format_error())
                    M.main_orm_session.flush()
                    M.main_orm_session.clear()
        base.log.info('Reindex done')

class EnsureIndexCommand(base.Command):
    min_args=1
    max_args=1
    usage = '[<ini file>]'
    summary = 'Run ensure_index on all mongo objects'
    parser = base.Command.standard_parser(verbose=True)

    def command(self):
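        '''Gather the index declarations from every mapped class and apply them
        to the main DB and to each project DB.'''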
        from allura import model as M
        self.basic_setup()
        # Collect indexes by collection name
        main_indexes = defaultdict(list)
        project_indexes = defaultdict(list)
        base.log.info('Collecting indexes...')
        for m in Mapper.all_mappers():
            mgr = m.collection.m
            cname = mgr.collection_name
            cls = m.mapped_class
            if cname is None:
                base.log.info('... skipping abstract class %s', cls)
                continue
            base.log.info('... for class %s', cls)
            if session(cls) in (
                    M.main_orm_session, M.repository_orm_session):
                idx = main_indexes[cname]
            else:
                idx = project_indexes[cname]
            idx.extend(mgr.indexes)
        base.log.info('Updating indexes for main DB')
        db = M.main_doc_session.db
        for name, indexes in main_indexes.iteritems():
            self._update_indexes(db[name], indexes)
        base.log.info('Updating indexes for project DBs')
        configured_dbs = set()
        for projects in utils.chunked_find(M.Project):
            for p in projects:
                db = p.database_uri
                if db in configured_dbs: continue
                configured_dbs.add(db)
                c.project = p
                db = M.project_doc_session.db
                base.log.info('... DB: %s', db)
                for name, indexes in project_indexes.iteritems():
                    self._update_indexes(db[name], indexes)
        if not configured_dbs:
            # e.g. during bootstrap with no projects
            db = M.project_doc_session.db
            base.log.info('... default DB: %s', db)
            for name, indexes in project_indexes.iteritems():
                self._update_indexes(db[name], indexes)
        base.log.info('Done updating indexes')

    def _update_indexes(self, collection, indexes):
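        '''Bring the indexes on `collection` in line with the declared ones:
        toggle unique flags where they changed, ensure declared indexes exist,
        and drop indexes that are no longer declared.'''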
        uindexes = dict(
            (tuple(i.index_spec), i)  # convert list to tuple so it can be used as a dict key
            for i in indexes
            if i.unique)
        indexes = dict(
            (tuple(i.index_spec), i)
            for i in indexes
            if not i.unique)
        prev_indexes = {}
        prev_uindexes = {}
        unique_flag_drop = {}
        unique_flag_add = {}
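        # Compare the indexes that already exist with the declared ones, noting
        # which need their unique flag toggled and which are left over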
        for iname, fields in collection.index_information().iteritems():
            if iname == '_id_':
                continue
            keys = tuple(fields['key'])
            if fields.get('unique'):
                if keys in indexes:
                    unique_flag_drop[iname] = keys
                else:
                    prev_uindexes[iname] = keys
            else:
                if keys in uindexes:
                    unique_flag_add[iname] = keys
                else:
                    prev_indexes[iname] = keys
        for iname, keys in unique_flag_drop.iteritems():
            self._recreate_index(collection, iname, list(keys), unique=False)
        for iname, keys in unique_flag_add.iteritems():
            self._recreate_index(collection, iname, list(keys), unique=True)
        # Ensure all indexes
        for keys, idx in uindexes.iteritems():
            base.log.info('...... ensure %s:%s', collection.name, idx)
            while True:
                try:
                    collection.ensure_index(idx.index_spec, unique=True)
                    break
                except DuplicateKeyError, err:
                    base.log.info('Found dupe key(%s), eliminating dupes', err)
                    self._remove_dupes(collection, idx.index_spec)
        for keys, idx in indexes.iteritems():
            base.log.info('...... ensure %s:%s', collection.name, idx)
            collection.ensure_index(idx.index_spec, background=True)
        # Drop obsolete indexes
        for iname, keys in prev_indexes.iteritems():
            if keys not in indexes:
                base.log.info('...... drop index %s:%s', collection.name, iname)
                collection.drop_index(iname)
        for iname, keys in prev_uindexes.iteritems():
            if keys not in uindexes:
                base.log.info('...... drop index %s:%s', collection.name, iname)
                collection.drop_index(iname)

    def _recreate_index(self, collection, iname, keys, **creation_options):
        '''Recreate an index with new creation options, using a temporary index
        so that at no time is an index missing from the specified keys'''
        superset_keys = keys + [('temporary_extra_field_for_indexing', 1)]
        base.log.info('...... ensure index %s:%s', collection.name, superset_keys)
        superset_index = collection.ensure_index(superset_keys)
        base.log.info('...... drop index %s:%s', collection.name, iname)
        collection.drop_index(iname)
        base.log.info('...... ensure index %s:%s %s', collection.name, keys, creation_options)
        collection.ensure_index(keys, **creation_options)
        base.log.info('...... drop index %s:%s', collection.name, superset_index)
        collection.drop_index(superset_index)

    def _remove_dupes(self, collection, spec):
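        '''Delete all but the first document in each group of documents that
        share the same values for the fields in `spec`, so a unique index can
        then be built.'''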
        iname = collection.create_index(spec)
        fields = [ f[0] for f in spec ]
        q = collection.find({}, fields=fields).sort(spec)
        def keyfunc(doc):
            return tuple(doc.get(f, None) for f in fields)
        dupes = []
        for key, doc_iter in groupby(q, key=keyfunc):
            docs = list(doc_iter)
            if len(docs) > 1:
                base.log.info('Found dupes with %s', key)
                dupes += [ doc['_id'] for doc in docs[1:] ]
        collection.drop_index(iname)
        collection.remove(dict(_id={'$in':dupes}))

def build_model_inheritance_graph():
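    '''Return a dict mapping each mapped class to a ([parents], [children]) pair
    of its mapped base classes and subclasses.'''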
    graph = dict((m.mapped_class, ([], [])) for m in Mapper.all_mappers())
    for cls, (parents, children) in graph.iteritems():
        for b in cls.__bases__:
            if b not in graph: continue
            parents.append(b)
            graph[b][1].append(cls)
    return graph

def dump_cls(depth, cls):
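    '''Yield indented lines describing a mapped class and its properties.'''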
    indent = ' '*4*depth
    yield indent + '%s.%s' % (cls.__module__, cls.__name__)
    m = mapper(cls)
    for p in m.properties:
        s = indent*2 + ' - ' + str(p)
        if hasattr(p, 'field_type'):
            s += ' (%s)' % p.field_type
        yield s

def dfs(root, graph, depth=0):
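    '''Depth-first traversal of the inheritance graph, yielding (depth, class)
    pairs starting from `root`.'''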
    yield depth, root
    for c in graph[root][1]:
        for r in dfs(c, graph, depth+1):
            yield r

def pm(etype, value, tb): # pragma no cover
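    '''Post-mortem debugger hook: prefer IPython's debugger if it is
    importable, otherwise fall back to plain pdb.'''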
    import pdb, traceback
    try:
        from IPython.ipapi import make_session; make_session()
        from IPython.Debugger import Pdb
        sys.stderr.write('Entering post-mortem IPDB shell\n')
        p = Pdb(color_scheme='Linux')
        p.reset()
        p.setup(None, tb)
        p.print_stack_trace()
        sys.stderr.write('%s: %s\n' % ( etype, value))
        p.cmdloop()
        p.forget()
        # p.interaction(None, tb)
    except ImportError:
        sys.stderr.write('Entering post-mortem PDB shell\n')
        traceback.print_exception(etype, value, tb)
        pdb.post_mortem(tb)