in aiops/RCRank/model/modules/QueryFormer/utils.py [0:0]
def get_hist_file(hist_path, bin_number=50):
    """Load a histogram CSV and decode its serialized columns.

    The CSV at ``hist_path`` must provide the columns ``table``, ``column``,
    ``freq`` and ``bins``. After loading:

    * ``freq`` holds, per row, a 1-D ``float64`` NumPy array decoded from the
      hex string stored in the file (the hex digits are the raw bytes of the
      array, interpreted in native byte order).
    * ``bins`` holds, per row, a list of ``int`` parsed from a bracketed,
      whitespace-separated string such as ``"[1 2 3]"``.
    * ``table_column`` is a new column of the form ``"<alias>.<column>"``,
      where the alias is built from the first character of every
      ``_``-separated token of the table name (``movie_info_idx`` is
      special-cased to ``mi_idx``).

    Args:
        hist_path: Path (or anything ``pandas.read_csv`` accepts) of the CSV.
        bin_number: Requested number of bins. When it differs from 50 the
            frame is passed through ``re_bin`` before being returned.
            NOTE(review): 50 is presumably the bin count the file was
            generated with -- confirm against the producer of the CSV.

    Returns:
        The ``pandas.DataFrame`` described above.
    """
    hist_file = pd.read_csv(hist_path)

    # ``np.float`` was only an alias of the builtin ``float`` (i.e. float64)
    # and was removed in NumPy 1.24, so the concrete dtype is spelled out.
    # The whole column is rebuilt and assigned in one step instead of using
    # chained ``df[col][i] = ...`` writes, which are unreliable in pandas.
    freq_arrays = [
        np.frombuffer(bytes.fromhex(freq_hex), dtype=np.float64)
        for freq_hex in hist_file['freq']
    ]
    hist_file['freq'] = pd.Series(
        freq_arrays, index=hist_file.index, dtype=object
    )

    table_column = []
    for table, col in zip(hist_file['table'], hist_file['column']):
        if table == 'movie_info_idx':
            # Hard-coded alias for this table.
            table_alias = 'mi_idx'
        else:
            table_alias = ''.join(tok[0] for tok in table.split('_'))
        table_column.append('.'.join([table_alias, col]))
    hist_file['table_column'] = table_column

    # Strip the surrounding brackets, then split on any run of whitespace
    # (repeated spaces yield no empty tokens).
    parsed_bins = [
        [int(tok) for tok in raw_bins[1:-1].split()]
        for raw_bins in hist_file['bins']
    ]
    hist_file['bins'] = pd.Series(
        parsed_bins, index=hist_file.index, dtype=object
    )

    if bin_number != 50:
        hist_file = re_bin(hist_file, bin_number)
    return hist_file