in convert_csv.py [0:0]
def get_dataframe(filename, export_type):
    """Read a delimited text file and return it as a DataFrame.

    The file's first line is treated as the header; every line equal to it
    is dropped (not only the first occurrence). Each remaining line is
    passed to ``parse_line`` together with ``export_type``, and the result
    is turned into a DataFrame using ``EXPORT_TYPES[export_type]`` as the
    schema.

    Args:
        filename: '/'-separated path handed to ``sc.textFile``. It must
            have at least three components: the last one is logged as the
            file name and the third-from-last as the agent.
        export_type: Key into ``EXPORT_TYPES``; also forwarded to
            ``parse_line``.

    Returns:
        Whatever ``sqlContext.createDataFrame`` returns for the parsed rows
        (presumably a Spark DataFrame -- confirm against the module setup).

    Raises:
        IndexError: If ``filename`` has fewer than three path components.
        KeyError: If ``export_type`` is not in ``EXPORT_TYPES`` (assuming
            it is a plain dict).
    """
    path_parts = filename.split('/')
    base_name = path_parts[-1]
    agent_name = path_parts[-3]
    print("Converting " + base_name + " for agent " + agent_name + "...")

    raw_lines = sc.textFile(filename)
    # Fetch the header up front; the filter below compares against it.
    header_line = raw_lines.first()

    def is_data_line(line):
        # Keep only lines that differ from the header line.
        return line != header_line

    def to_row(line):
        return parse_line(line, export_type)

    parsed_rows = raw_lines.filter(is_data_line).map(to_row)
    schema = EXPORT_TYPES[export_type]
    return sqlContext.createDataFrame(parsed_rows, schema)