in sagemaker/source/preprocessing/dataframewriter.py [0:0]
def flush_buffer(self):
    """Write the buffered rows to ``self.filename`` as CSV and empty the buffer.

    The rows held in ``self.data`` are loaded into a DataFrame labelled with
    ``self.columns``; rows that are exact duplicates within this batch are
    dropped before writing. While ``self.first_write`` is truthy the file is
    opened in ``'w'`` mode and a header row is emitted, after which the flag
    is cleared; every later flush appends rows without a header.
    """
    frame = pd.DataFrame(data=self.data, columns=self.columns).drop_duplicates()
    print('\tWriting {} records'.format(len(frame)))

    # Only the first flush truncates the file and writes the column names.
    is_first = bool(self.first_write)
    frame.to_csv(
        path_or_buf=self.filename,
        mode='w' if is_first else 'a',
        header=is_first,
        index=False,
    )
    if is_first:
        self.first_write = False

    # Start over with an empty buffer for the next batch.
    self.data = []