in codes/data_processing.py [0:0]
def pre_processing(x: str, genome_dict: dict) -> list:
    """Transfer a K-mer tokenized DNA sequence into its encoded values.

    The sequence is split on runs of whitespace and every resulting token
    is replaced by the value stored under it in ``genome_dict``.

    Args:
        x: Whitespace-separated K-mer tokens, e.g. ``"ATG TGC GCA"``.
        genome_dict: Lookup table keyed by K-mer token. Presumably the
            values are integer ids -- confirm against the caller.

    Returns:
        A new list with one looked-up value per token, in input order.
        Empty or whitespace-only input yields an empty list.

    Raises:
        KeyError: If a token is missing from ``genome_dict`` (for a plain
            ``dict``). Unknown K-mers are deliberately not skipped so that
            vocabulary mismatches surface instead of shifting positions.
    """
    # split() with no argument collapses consecutive whitespace and drops
    # leading/trailing blanks, so no empty tokens ever reach the lookup.
    return [genome_dict[kmer] for kmer in x.split()]