in cluster-trace-gpu-v2020/analysis/utils.py [0:0]
def get_hourly_task_request(df): # df = dftjkix
sum_df_list = []
df = add_hour_date(df.copy())
# for day in sorted(df.dayofyear.unique()):
for date in sorted(df.date.unique()):
# tempdf = df[df.dayofyear==day]
tempdf = df[df.date==date]
res_df = tempdf.groupby('hour').count()[['job_name']]
res_df.rename(columns={'job_name':date}, inplace=True)
sum_df_list.append(res_df.T)
out_df = pd.DataFrame().append(sum_df_list)
return out_df.dropna() # if a day contains hours of NaN, it is not a typical day