# -*- coding: utf-8 -*-
# Filename: productBuilder.py
"""
product builder for macsProcessor
=================================
This is part of the macsProcessor suite.
Copyright (C) 2014 Tobias Kölling
"""
import argparse
import os
import yaml
import runmacs.processor.product as product
import runmacs.processor.metaStorage as metaStorage
from runmacs.processor.productaccessor import ProductAccessor
from runmacs.processor.productregistry import get_default_registry
from runmacs.processor.collection import find_collections_in_folder, collection_from_dict
from runmacs.processor.querybuilder import processQuery
from runmacs.processor.buildhelpers import *
import logging
import pymongo
logger = logging.getLogger(__name__)
batchSize = 1
class ProductBuilder(object):
"""
The product builder is responsible for discovering new products.
:param db: MetaStorage to be used as product database
:param registry: ProductRegistry containing all desired products
:param accessor: ProductAccessor to get available products from the database
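    :param collections: collections whose file sources should be
        considered when crawling (defaults to an empty list)

    Typical usage (a minimal sketch; the connection string and database
    collection name below are placeholders, not real deployment values)::

        # connection string and collection name are illustrative
        db = metaStorage.MongoDBMetaStorage('mongodb://localhost:27017/', 'products')
        builder = ProductBuilder(db, registry=get_default_registry())
        builder.run()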
"""
def __init__(self, db, registry, collections=None, accessor=None):
self.db = db
self.registry = registry
        if accessor is None:
self.accessor = ProductAccessor(db)
else:
self.accessor = accessor
if collections is None:
self.collections = []
else:
self.collections = collections
self.needToScan = True
self.needToCrawl = []
self.rescanAll = False
self.rescanProduct = None
self.logger = logging.getLogger(__name__ + '.ProductBuilder')
self.db.ensureIndex('_creationRev')
self.db.ensureIndex('_oid')
self.db.ensureIndex('collections')
self.db.ensureIndex('componentOids')
self.db.ensureIndex('is_primary')
self.db.ensureIndex('filename')
self.db.ensureIndex('date') # sorting by date is common, so this index is generally sensible
for index in product.Product.requiredIndices:
self.db.ensureIndex(index)
try:
self.dbState = self.db.getObject('__dbState__')
except KeyError:
self.dbState = {'inProcessRev': 0,
'completeRev': -1}
self.incInProcessRev()
def incInProcessRev(self):
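        """
        Bump the in-process revision counter and persist it, so that
        products created during this run can be distinguished from older
        ones via their ``_creationRev`` field.
        """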
self.inProcessRev = self.dbState['inProcessRev'] + 1
self.dbState['inProcessRev'] = self.inProcessRev
self.db.setObject('__dbState__', self.dbState)
def buildProduct(self, prototype, extraQuery, primaryComponent=None):
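        """
        Recursively try to complete ``prototype``.

        Asks the prototype what it needs next (``whatIsNeeded``), queries
        the accessor for matching candidate components and recurses with
        each partially filled prototype.  Once nothing more is needed, the
        finished product spec is stored in the database, tagged with the
        intersection of its components' collections.

        :param prototype: (partially built) product to complete
        :param extraQuery: additional constraints merged into each query
        :param primaryComponent: optional component name to resolve first
        """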
if prototype.building is False:
needed = None
elif primaryComponent is None:
needed = prototype.whatIsNeeded()
else:
needed = prototype.whatIsNeeded(primaryComponent)
if len(prototype.components) > 0:
component_collections = [set(component.collections)
for component in prototype.components.values()]
collections = component_collections[0].intersection(*component_collections[1:])
else:
collections = None
if needed is None:
#product built completely -> store it
            if prototype.building:
raise RuntimeError('prototype does not need anything but is still building')
p = prototype #for clarity, we do have a product now
print "FOUND PRODUCT:", p
oid = p.hash
try:
objectInDb = self.db.getObject(oid)
except KeyError:
try:
ps = p.productSpec
except ValueError:
logger.exception('could not get product spec, skipping')
return
ps['_creationRev'] = self.inProcessRev
ps['_oid'] = oid
                if collections is not None:
ps['collections'] = list(collections)
self.db.addObject(oid, ps)
self.needToScan = True
print "stored new product (%s)"%p.productClassName()
return
query = needed['query']
sort = None
limit = None
if isinstance(query, tuple):
query, queryModifiers = query
            if 'sortBy' in queryModifiers:
sort = queryModifiers['sortBy']
            if 'limit' in queryModifiers:
limit = queryModifiers['limit']
representation = needed['representation']
neededComponentName = needed['componentName']
for k, v in extraQuery.items():
query[k] = v
if collections is not None:
query["collections"] = {"$in": list(collections)}
foundSomething = False
subExtraQuery = extraQuery.copy()
subExtraQuery['_creationRev'] = {'$gte': -1}
with self.accessor.query(query, limit=limit, sort=sort, batchSize=batchSize) as cursor:
            if representation == 'single':
for prod in cursor:
foundSomething = True
for sub in QueryResolutionIterator(prototype, neededComponentName, prod, self.accessor):
self.buildProduct(sub, subExtraQuery)
elif representation == 'list':
products = list(cursor)
if len(products) > 0:
foundSomething = True
for sub in QueryResolutionIterator(prototype, neededComponentName, products, self.accessor):
self.buildProduct(sub, subExtraQuery)
else:
raise ValueError('unknown representation "%s"!'%representation)
#if not foundSomething:
# self.logger.debug('found nothing for query "%s" from %s', query, prototype.productClassName())
def run_crawl_request(self, crawl):
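        """
        Import new primary products for a single :class:`CrawlRequest`.

        Walks the file sources of all known collections at the crawl's
        place, skips files that were already imported, and stores a new
        product (marked ``is_primary``) for each remaining file.  Files
        already present in the database are merely tagged with the
        collection id (and marked primary if needed).
        """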
products = []
pathPrefixLen = len(crawl.folder+os.sep)
for collection in self.collections:
alreadyImported = get_already_imported_files_of(crawl.base_product,
self.registry,
self.accessor,
collection=collection.cid)
for filesource in collection.files:
                if filesource.place != crawl.place:
continue
path = os.path.join(crawl.folder, filesource.filename)
pathSuffix = path[pathPrefixLen:]
                if pathSuffix in alreadyImported:
print "haz", pathSuffix
continue
try:
p = build_product_from_filename(pathSuffix,
crawl.place,
crawl.base_product,
self.registry,
self.accessor)
except ValueError:
#print "no Product for %s"%path
continue
oid = p.hash
try:
objectInDb = self.db.getObject(oid)
except KeyError:
ps = p.productSpec
ps['_creationRev'] = self.inProcessRev
ps['_oid'] = oid
ps['collections'] = [collection.cid]
ps['is_primary'] = True
self.db.addObject(oid, ps)
else:
if collection.cid not in objectInDb.get('collections', []):
self.db.update({'_oid': oid},
{"$addToSet": {"collections": collection.cid}})
if not objectInDb.get('is_primary', False):
self.db.update({'_oid': oid},
{"$set": {"is_primary": True}})
def propagate_collections(self, collections):
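        """
        Propagate collection membership from components to derived products.

        A derived product should belong to every collection that *all* of
        its components belong to.  Returns ``True`` if any product was
        updated, so callers can iterate this to a fixed point.
        """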
did_change = False
for collection in collections:
in_collection = [res["_oid"]
for res
in self.db.query(query={"collections": collection},
projection={"_oid": 1})]
missing_query = {"componentOids": {"$elemMatch": {"$elemMatch": {"$in": in_collection}}},
"collections": {"$nin": [collection]},
"is_primary": {"$ne": True}}
maybe_missing_collection = self.db.query(missing_query)
for candidate in maybe_missing_collection:
component_oids = [oid for name, oid in candidate["componentOids"]]
component_collections = [set(res.get("collections",[]))
for res
in self.db.query({"_oid": {"$in": component_oids}})]
desired_collections = component_collections[0].intersection(
*component_collections[1:])
additional_collections = desired_collections - set(candidate.get("collections", []))
if len(additional_collections) > 0:
for additional_collection in additional_collections:
self.db.update({"_oid": candidate["_oid"]},
{"$addToSet":
{"collections": additional_collection}})
did_change = True
return did_change
def run(self):
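        """
        Main loop: execute pending crawl requests, propagate collection
        membership to a fixed point, then repeatedly scan for derivable
        products until a full pass creates nothing new.
        """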
for crawl in self.needToCrawl:
self.run_crawl_request(crawl)
collection_ids = set([collection.cid for collection in self.collections])
while self.propagate_collections(collection_ids):
pass
        derivedProducts = list(self.registry.find_derived_products())
while self.needToScan:
if self.rescanAll:
minQueryRev = -1
self.rescanAll = False
else:
minQueryRev = self.dbState['completeRev']
                # not very elegant, but needed as long as products do not
                # query for every possible input on their first query
                #minQueryRev = -1
self.incInProcessRev()
self.needToScan = False
            for dp in derivedProducts:
prototype = dp.build()
_minQueryRev = minQueryRev
                if self.rescanProduct is not None and self.rescanProduct.lower() in dp.productClassName().lower():
minQueryRev = -1
try:
componentNames = prototype.componentNames
except AttributeError:
self.buildProduct(prototype, {'_creationRev': {'$gte': minQueryRev}})
else:
for primaryComponent in componentNames:
self.buildProduct(prototype, {'_creationRev': {'$gte': minQueryRev}}, primaryComponent)
minQueryRev = _minQueryRev
self.dbState['completeRev'] = self.inProcessRev
self.db.setObject('__dbState__', self.dbState)
self.rescanProduct = None
class QueryResolutionIterator(object):
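    """
    Iterate over the prototypes that result from adding ``component`` to
    ``prototype``.

    ``tryToAdd`` is treated as a generator-based coroutine: whenever it
    yields a request flagged with ``needMoreData``, the request's query is
    run against the accessor and the first result is sent back in via
    ``send`` (or a ``DataNotFoundError`` is thrown in if nothing matches).
    All other yielded values are passed through to the caller.
    """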
def __init__(self, prototype, componentName, component, accessor):
self.prototype = prototype
self.componentName = componentName
self.component = component
self.accessor = accessor
def __iter__(self):
it = iter(self.prototype.tryToAdd(self.componentName, self.component))
needMoreData = False
while True:
try:
if needMoreData:
needMoreData = False
try:
nextData = iter(self.accessor.query(query, limit=limit, sort=sort, batchSize=1)).next()
except StopIteration:
res = it.throw(DataNotFoundError('no matching data found'))
else:
res = it.send(nextData)
else:
res = it.next()
if getattr(res, 'needMoreData', False):
needMoreData = True
query = res.query
sort = None
limit = 1
                    if isinstance(query, tuple):
query, queryModifiers = query
                        if 'sortBy' in queryModifiers:
sort = queryModifiers['sortBy']
else:
yield res
            except StopIteration:
break
except:
print "error during processing of component %s (%s) for prototype %s"%(self.componentName, self.component.hash, self.prototype)
raise
class CrawlRequest(object):
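    """
    A request to crawl ``folder`` at ``place`` for files that should be
    imported as instances of ``base_product``.
    """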
def __init__(self, folder, base_product, place):
self.folder = folder
self.base_product = base_product
self.place = place
def get_already_imported_files_of(baseclass, registry, accessor, collection=None):
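    """
    Return the set of filenames already covered by imported products.

    Considers every registered subclass of ``baseclass`` that implements
    ``getCoveredFilenames``, optionally restricted to one collection.
    """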
fns = set()
query = {}
if collection is not None:
query["collections"] = collection
for c in registry.find_subclasses(baseclass):
if hasattr(c, 'getCoveredFilenames'):
query["productClass"] = c.productClassName()
for p in accessor.query(query):
fns |= set(p.getCoveredFilenames())
return fns
def build_product_from_filename(filename, place, baseclass, registry, accessor):
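    """
    Try all registered subclasses of ``baseclass`` until one accepts
    ``filename`` via ``fromFilename``; raise ``ValueError`` if none does.
    """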
for c in registry.find_subclasses(baseclass):
if c.updateProduct != baseclass.updateProduct:
#separate normal and update file calls
continue
try:
return c.fromFilename(filename, place, accessor)
except ValueError:
continue
raise ValueError('product class not found')
if __name__ == '__main__':
from runmacs.processor.config import config
logging.basicConfig(level=logging.DEBUG)
parser = argparse.ArgumentParser(description='generates macs products')
    parser.add_argument('--crawl', dest='crawl', action='store_true')
    parser.add_argument('--skip-crawl', dest='crawl', action='store_false')
    parser.set_defaults(crawl=True)
    parser.add_argument('--crawl-dir', dest='crawlDir', type=str, default='.')
    parser.add_argument('--rescan', dest='rescan', action='store_true')
    parser.add_argument('--no-rescan', dest='rescan', action='store_false')
    parser.set_defaults(rescan=False)
    # should we generate derived products?
    parser.add_argument('--derrive', dest='derrive', action='store_true')
    parser.add_argument('--no-derrive', dest='derrive', action='store_false')
    parser.set_defaults(derrive=True)
    parser.add_argument('--production', dest='production', action='store_true')
    parser.add_argument('--devel', dest='production', action='store_false')
    parser.set_defaults(production=False)
    parser.add_argument('--collection', default=None, type=int, help="collection id to crawl")
    parser.add_argument('--rescan-product', type=str)
    parser.add_argument('--ldb', dest='ldb', default=False, action='store_true')
args = parser.parse_args()
if args.production:
if config['database']['type'] == 'mongodb':
db = metaStorage.MongoDBMetaStorage(config['database']['connection'], config['database']['collection'])
else:
raise RuntimeError('unknown database type "%s"!'%config['database']['type'])
#from raven.handlers.logging import SentryHandler
#handler = SentryHandler('http://4d1399ca040f413d892f2da03a418771:a39aaab9d0754bce910aba7eb06baf27@blesshuhn.meteo.physik.uni-muenchen.de:8001/3')
#from raven.conf import setup_logging
#setup_logging(handler)
crawlDirs = config['data']
else:
if args.ldb:
db = metaStorage.LevelDBMetaStorage('products.ldb')
else:
db = metaStorage.MongoDBMetaStorage('mongodb://blesshuhn:27017/', 'macsServer_devel')
crawlDirs = {}
for crawlPlace, params in crawlDirs.items():
if params['method'] != 'local' and args.crawl:
logger.error('cannot crawl "%s" source method "%s", skipping it!', crawlPlace, params['method'])
continue
        crawlRequests = []
if args.crawl:
            crawlRequests.append(CrawlRequest(params['folder'],
                                              product.ImportedFileProduct,
                                              crawlPlace))
if 'updatesFolder' in params:
                crawlRequests.append(CrawlRequest(params['updatesFolder'],
                                                  product.UpdateFileProduct,
                                                  crawlPlace))
if args.collection is None:
collections = find_collections_in_folder(os.path.join(params['folder'],
'..',
'collections'))
else:
with open(os.path.join(params['folder'], '..', 'collections', 'collection_{}.yaml'.format(args.collection))) as collfile:
                collections = [collection_from_dict(args.collection, yaml.safe_load(collfile))]
pb = ProductBuilder(db,
registry=get_default_registry(),
collections=collections)
        pb.needToCrawl = crawlRequests
pb.needToScan = args.derrive
pb.rescanAll = args.rescan
pb.rescanProduct = args.rescan_product
logger.info('productBuilder start for crawl place "%s"!', crawlPlace)
pb.run()