rhelmer · December 9, 2011 22:11 · peterbe · Dec 9, 2011
diff --git a/gistfile1.diff b/gistfile1.diff
 diff --git a/socorro/processor/processor.py b/socorro/processor/processor.py
 index b3964a1..1754215 100755
 --- a/socorro/processor/processor.py
 +++ b/socorro/processor/processor.py
 @@ -123,6 +123,8 @@ class Processor(object):
     self.prefixSignatureRegEx = re.compile(self.config.prefixSignatureRegEx)
     self.signaturesWithLineNumbersRegEx = re.compile(self.config.signaturesWithLineNumbersRegEx)
 
 +    self.productIdMap = []
 +
     self.reportsTable = sch.ReportsTable(logger=config.logger)
     self.extensionsTable = sch.ExtensionsTable(logger=config.logger)
     self.framesTable = sch.FramesTable(logger=config.logger)
 @@ -170,7 +172,7 @@ class Processor(object):
       logger.debug("success")
       db_conn.commit()
     except sdb.exceptions_eligible_for_retry:
 -      logger.debug("timout trouble")
 +      logger.debug("timeout trouble")
       raise
     except sdb.db_module.ProgrammingError, x:
       logger.debug('the priority jobs table (%s) already exists',
 @@ -656,6 +658,19 @@ class Processor(object):
     """
     #logger.debug("starting insertReportIntoDatabase")
     product = Processor.getJsonOrWarn(jsonDocument,'ProductName',processorErrorMessages,None, 30)
 +    productId = Processor.getJsonOrWarn(jsonDocument,'ProductId',processorErrorMessages,None, 30)
 +
 +    # Some clients report the same ProductName under a different ProductId. The
 +    # product_productid_map rows are loaded once and cached on the instance.
 +    # NOTE(review): an empty table leaves the cache falsy, so it is re-queried per call.
 +    if not self.productIdMap:
 +      self.productIdMap = self.loadProductIdMap()
 +    logger.debug("product ID map: %s", self.productIdMap)
 +    for p in self.productIdMap:  # each p is a dict keyed by column name
 +      if productId == p['productid'] and p['rewrite'] and product != p['product_name']:
 +        logger.info("Product name %s rewritten to %s", product, p['product_name'])
 +        product = p['product_name']
 +
     version = Processor.getJsonOrWarn(jsonDocument,'Version', processorErrorMessages,None,16)
     buildID =   Processor.getJsonOrWarn(jsonDocument,'BuildID', processorErrorMessages,None,16)
     url = sutil.lookupLimitedStringOrNone(jsonDocument, 'URL', 255)
 @@ -836,3 +851,27 @@ class Processor(object):
                                            showTraceback=False)
     except KeyError:
       self.config.logger.info('no Elastic Search URL has been configured')
 +
 +
 +  #-----------------------------------------------------------------------------------------------------------------
 +  def loadProductIdMap(self):
 +    """Return the product_productid_map rows as a list of dicts keyed by column name.
 +
 +    A failure is logged and rolled back, then the exception is re-raised.
 +    """
 +    # Select the columns by name so the dict keys cannot silently drift from the
 +    # table's column order. NOTE(review): confirm these names against the schema.
 +    columns = ('product_name', 'productid', 'rewrite', 'version_began', 'version_ended')
 +    db_conn, db_cur = self.databaseConnectionPool.connectionCursorPair()
 +    try:
 +      logger.debug("attempting to load product_productid_map")
 +      db_cur.execute("SELECT %s FROM product_productid_map" % ', '.join(columns))
 +      productIdList = db_cur.fetchall()
 +      logger.debug("done loading product_productid_map")
 +      db_conn.commit()
 +    except:
 +      # bare except is deliberate: roll back on any failure, then re-raise unchanged
 +      logger.error('Unable to load product_productid_map')
 +      db_conn.rollback()
 +      raise
 +    return [dict(zip(columns, result)) for result in productIdList]
	diff --git a/socorro/processor/processor.py b/socorro/processor/processor.py
	index b3964a1..1754215 100755
	--- a/socorro/processor/processor.py
	+++ b/socorro/processor/processor.py
	@@ -123,6 +123,8 @@ class Processor(object):
	self.prefixSignatureRegEx = re.compile(self.config.prefixSignatureRegEx)
	self.signaturesWithLineNumbersRegEx = re.compile(self.config.signaturesWithLineNumbersRegEx)

	+ self.productIdMap = []
	+
	self.reportsTable = sch.ReportsTable(logger=config.logger)
	self.extensionsTable = sch.ExtensionsTable(logger=config.logger)
	self.framesTable = sch.FramesTable(logger=config.logger)
	@@ -170,7 +172,7 @@ class Processor(object):
	logger.debug("success")
	db_conn.commit()
	except sdb.exceptions_eligible_for_retry:
	- logger.debug("timout trouble")
	+ logger.debug("timeout trouble")
	raise
	except sdb.db_module.ProgrammingError, x:
	logger.debug('the priority jobs table (%s) already exists',
	@@ -656,6 +658,19 @@ class Processor(object):
	"""
	#logger.debug("starting insertReportIntoDatabase")
	product = Processor.getJsonOrWarn(jsonDocument,'ProductName',processorErrorMessages,None, 30)
	+    productId = Processor.getJsonOrWarn(jsonDocument,'ProductId',processorErrorMessages,None, 30)
	+
	+    # Some clients report the same ProductName under a different ProductId. The
	+    # product_productid_map rows are loaded once and cached on the instance.
	+    # NOTE(review): an empty table leaves the cache falsy, so it is re-queried per call.
	+    if not self.productIdMap:
	+      self.productIdMap = self.loadProductIdMap()
	+    logger.debug("product ID map: %s", self.productIdMap)
	+    for p in self.productIdMap:  # each p is a dict keyed by column name
	+      if productId == p['productid'] and p['rewrite'] and product != p['product_name']:
	+        logger.info("Product name %s rewritten to %s", product, p['product_name'])
	+        product = p['product_name']
	+
	version = Processor.getJsonOrWarn(jsonDocument,'Version', processorErrorMessages,None,16)
	buildID = Processor.getJsonOrWarn(jsonDocument,'BuildID', processorErrorMessages,None,16)
	url = sutil.lookupLimitedStringOrNone(jsonDocument, 'URL', 255)
	@@ -836,3 +851,27 @@ class Processor(object):
	showTraceback=False)
	except KeyError:
	self.config.logger.info('no Elastic Search URL has been configured')
	+
	+
	+ #-----------------------------------------------------------------------------------------------------------------
	+  def loadProductIdMap(self):
	+    """Return the product_productid_map rows as a list of dicts keyed by column name.
	+
	+    A failure is logged and rolled back, then the exception is re-raised.
	+    """
	+    # Select the columns by name so the dict keys cannot silently drift from the
	+    # table's column order. NOTE(review): confirm these names against the schema.
	+    columns = ('product_name', 'productid', 'rewrite', 'version_began', 'version_ended')
	+    db_conn, db_cur = self.databaseConnectionPool.connectionCursorPair()
	+    try:
	+      logger.debug("attempting to load product_productid_map")
	+      db_cur.execute("SELECT %s FROM product_productid_map" % ', '.join(columns))
	+      productIdList = db_cur.fetchall()
	+      logger.debug("done loading product_productid_map")
	+      db_conn.commit()
	+    except:
	+      # bare except is deliberate: roll back on any failure, then re-raise unchanged
	+      logger.error('Unable to load product_productid_map')
	+      db_conn.rollback()
	+      raise
	+    return [dict(zip(columns, result)) for result in productIdList]
No results found