in o2a/mappers/spark_mapper.py [0:0]
def to_tasks_and_relations(self):
action_task = Task(
task_id=self.name,
template_name="spark.tpl",
template_params=dict(
job_name=self.job_name,
spark_job=dict(
args=self.application_args,
jar_file_uris=self.dataproc_jars,
file_uris=self.hdfs_files,
archive_uris=self.hdfs_archives,
properties=self.spark_opts,
main_jar_file_uri=self.java_jar,
main_class=self.java_class
)
),
)
tasks = [action_task]
relations: List[Relation] = []
prepare_task = self.prepare_extension.get_prepare_task()
if prepare_task:
tasks, relations = self.prepend_task(prepare_task, tasks, relations)
return tasks, relations