# in src/createEntityRecognizer.py [0:0]
def lambda_handler(event, context):
    """Submit a Comprehend ``create_entity_recognizer`` request.

    A unique recognizer name is generated per invocation by appending a
    random UUID to the ``aim317-recognizer`` prefix. The S3 locations of the
    training documents and annotations, and the data-access role, come from
    environment variables.

    Args:
        event: Lambda invocation payload. Not read by this handler.
        context: Lambda runtime context. Not read by this handler.

    Returns:
        A dict with the single key ``EntityRecognizerArn`` holding the ARN
        taken from the service response.

    Raises:
        KeyError: If ``ComprehendAnnotationBucket`` or ``ComprehendARN`` is
            not set in the environment.
    """
    recognizer_name = f"aim317-recognizer-{uuid.uuid4()}"
    comprehend = boto3.client('comprehend')

    # NOTE(review): both bucket names are read from the same environment
    # variable. That is correct if documents and annotations share a bucket,
    # but it may be a copy-paste slip -- confirm against the deployment
    # template before changing it.
    training_bucket = os.environ['ComprehendAnnotationBucket']
    annotation_bucket = os.environ['ComprehendAnnotationBucket']

    # The entity labels the recognizer is asked to learn.
    entity_types = [
        {"Type": label} for label in ("MOVEMENT", "BRAIN", "ETHICS")
    ]

    input_data_config = {
        'DataFormat': 'COMPREHEND_CSV',
        "EntityTypes": entity_types,
        'Documents': {
            'S3Uri': f"s3://{training_bucket}/comprehend/train/train.csv",
            'InputFormat': 'ONE_DOC_PER_LINE',
        },
        'Annotations': {
            'S3Uri': f"s3://{annotation_bucket}/comprehend/train/annotations.csv",
        },
    }

    result = comprehend.create_entity_recognizer(
        RecognizerName=recognizer_name,
        DataAccessRoleArn=os.environ['ComprehendARN'],
        InputDataConfig=input_data_config,
        LanguageCode='en',
        VersionName='v001',
    )

    return {'EntityRecognizerArn': result['EntityRecognizerArn']}