in src/process_transcription_full_text.py [0:0]
def parse_detected_entities_response(detected_entities_response, entities):
    """Merge the entities found in a detection response into ``entities``.

    The response is expected to look like the result of a
    ``batch_detect_entities`` call (the name used in the error log message):
    an optional ``ErrorList`` and an optional ``ResultList`` whose items each
    carry an ``Entities`` list of dicts with ``Score``, ``Type`` and ``Text``.

    An entity is kept when its score is at least
    ``ENTITY_CONFIDENCE_THRESHOLD`` and its type is not ``QUANTITY``.
    LOCATION, PERSON and ORGANIZATION texts that are not entirely upper-case
    are normalised with ``string.capwords``; fully upper-case texts are left
    untouched.

    Args:
        detected_entities_response: Mapping holding the detection response.
        entities: Dict mapping an entity type to the set of texts seen so far.
            It is updated in place.

    Returns:
        The same ``entities`` dict that was passed in. It is returned even
        when the response has no ``ResultList``, so entities accumulated from
        earlier responses are never discarded.
    """
    error_list = detected_entities_response.get('ErrorList')
    if error_list:
        # Errors are only reported; any results present are still processed.
        logger.error("encountered error during batch_detect_entities")
        logger.error("error:" + json.dumps(error_list, indent=4))

    for result in detected_entities_response.get('ResultList', ()):
        for detected_entity in result["Entities"]:
            score = float(detected_entity["Score"])
            # Written as "not >=" so that a NaN score is rejected as well.
            if not (score >= ENTITY_CONFIDENCE_THRESHOLD):
                continue

            entity_type = detected_entity["Type"]
            if entity_type == 'QUANTITY':
                continue

            text = detected_entity["Text"]
            if entity_type in ('LOCATION', 'PERSON', 'ORGANIZATION'):
                # Leave all-caps texts alone; title-case everything else.
                if not text.isupper():
                    text = string.capwords(text)

            entities.setdefault(entity_type, set()).add(text)

    return entities