in code/workflow/implementations/autopilot/bp_init_stage.py [0:0]
def get_config(self) -> dict:
    """Build the processing-job configuration dictionary for this stage.

    The inputs, output and container arguments are produced by this
    object's own helpers (``create_processing_inputs``,
    ``create_processing_output`` and ``create_container_arguments``); the
    remaining values are read from ``self`` and ``self.base_config``.

    NOTE(review): the key names match the SageMaker ``CreateProcessingJob``
    request shape, so this dict is presumably passed to that API -- confirm
    against the caller.

    Returns:
        A new dict with the keys ``ProcessingJobName``, ``ClusterConfig``,
        ``AppSpecification``, ``RoleArn``, ``ProcessingInputs``,
        ``ProcessingOutputConfig`` and ``StoppingCondition``.
    """
    # Base directory handed to the input/output helpers.
    processing_dir = "/opt/ml/processing"
    output_content_type = "CSV"
    volume_size_in_gb = 30
    max_runtime_in_seconds = 86400  # 24 hours

    # Copy whatever iterable the helper returns into a fresh list so the
    # returned config never aliases the helper's own object.
    processing_inputs = list(
        self.create_processing_inputs(processing_dir, self.flow, self.flow_uri)
    )
    processing_outputs = [
        self.create_processing_output(
            self.output_name, self.output_path, processing_dir
        )
    ]
    job_arguments = self.create_container_arguments(
        self.output_name, output_content_type
    )

    return {
        "ProcessingJobName": self.name,
        "ClusterConfig": {
            "InstanceType": self.base_config.dp_instance_type,
            "InstanceCount": self.base_config.dp_instance_count,
            "VolumeSizeInGB": volume_size_in_gb,
        },
        "AppSpecification": {
            "ImageUri": self.container_uri,
            "ContainerArguments": job_arguments,
        },
        "RoleArn": self.base_config.iam_role,
        "ProcessingInputs": processing_inputs,
        "ProcessingOutputConfig": {
            "Outputs": processing_outputs,
        },
        "StoppingCondition": {
            "MaxRuntimeInSeconds": max_runtime_in_seconds,
        },
    }