in notebook/utils/wf.py [0:0]
def _get_merged_df(cls, bucket, prefix, s3_client, show_header=True, has_header=True, maxkeys=10):
    """Read the CSV objects listed under an S3 prefix and concatenate them.

    A single ``list_objects_v2`` call is made, so at most ``maxkeys`` objects
    (the first page of the listing) are read; further pages are not followed.

    Args:
        cls: Unused by this function; kept for the existing call signature.
        bucket: Name of the S3 bucket to list and read from.
        prefix: Key prefix passed to the listing call.
        s3_client: Object exposing ``list_objects_v2(Bucket=, Prefix=, MaxKeys=)``
            and returning a dict whose optional ``'Contents'`` entry is a list
            of dicts with a ``'Key'`` field.
        show_header: When the files have a header row, keep it as the column
            names (True) or drop it and use positional column labels (False).
        has_header: Whether each file starts with a header row. When False,
            every row is treated as data regardless of ``show_header``.
        maxkeys: Upper bound on the number of objects requested from the listing.

    Returns:
        The concatenation (``pd.concat``) of one DataFrame per listed object,
        or an empty DataFrame when the listing contains no objects.
    """
    resp = s3_client.list_objects_v2(Bucket=bucket, Prefix=prefix, MaxKeys=maxkeys)

    # The listing response has no 'Contents' entry when nothing matches the
    # prefix; return an empty frame instead of failing with KeyError.
    contents = resp.get('Contents') or []
    if not contents:
        return pd.DataFrame()

    # The parsing options depend only on the flags, so decide them once
    # rather than once per object.
    if has_header and show_header:
        read_opts = {}
    else:
        # Without a header to show, columns are positional; skip the first
        # row only when it actually is a header.
        read_opts = {'skiprows': 1 if has_header else 0, 'header': None}

    frames = [
        pd.read_csv("s3://{}/{}".format(bucket, obj["Key"]), **read_opts)
        for obj in contents
    ]
    return pd.concat(frames)