in cluster-trace-gpu-v2020/analysis/utils.py [0:0]
def add_hour_date(df):
    """Ensure *df* has ``start_date``, ``date`` and ``hour`` columns.

    The frame is modified in place and also returned. Columns that already
    exist are left untouched.

    * ``start_date`` is built from ``start_time_t`` if present, otherwise
      from ``start_time``. The values are read as seconds since the Unix
      epoch and expressed in the ``Asia/Shanghai`` time zone.
    * ``date`` holds the calendar date of ``start_date``.
    * ``hour`` holds the hour-of-day of ``start_date``.

    Args:
        df: pandas DataFrame to augment.

    Returns:
        The same DataFrame object, or ``None`` (after printing a message)
        when ``start_date`` is missing and neither ``start_time_t`` nor
        ``start_time`` is available to derive it from.
    """
    if 'start_date' not in df:
        if 'start_time_t' in df:
            target_col = 'start_time_t'
        elif 'start_time' in df:
            target_col = 'start_time'
        else:
            # NOTE: the message mentions 'dayofyear', but only the two
            # start-time columns are actually looked up here.
            print('start_time, start_time_t, dayofyear unfound in df')
            return None
        # Vectorized conversion instead of a per-row pd.Timestamp(...) call:
        # epoch seconds are anchored to UTC, then shifted to local time.
        df['start_date'] = (
            pd.to_datetime(df[target_col], unit='s', utc=True)
            .dt.tz_convert('Asia/Shanghai')
        )

    start_date = df['start_date']
    # A caller-supplied 'start_date' may be an object column of Timestamps,
    # which has no .dt accessor; fall back to element-wise access for it.
    use_dt_accessor = pd.api.types.is_datetime64_any_dtype(start_date)

    if 'date' not in df:
        if use_dt_accessor:
            df['date'] = start_date.dt.date
        else:
            df['date'] = start_date.apply(lambda ts: ts.date())
    if 'hour' not in df:
        if use_dt_accessor:
            df['hour'] = start_date.dt.hour
        else:
            df['hour'] = start_date.apply(lambda ts: ts.hour)
    return df