def pre_processing()

in codes/data_processing.py [0:0]


def pre_processing(x, genome_dict):
    """Map a whitespace-separated token string to its dictionary values.

    The input is split on runs of whitespace (``str.split()`` with no
    arguments), and every resulting token is looked up in ``genome_dict``.

    Args:
        x: String of tokens separated by whitespace. Per the original
            comment these are K-mer tokenized DNA sequences.
        genome_dict: Mapping from token to its encoded value. The original
            comment says the values are integers -- not enforced here.

    Returns:
        A new list holding ``genome_dict[token]`` for each token, in input
        order. An empty or all-whitespace string yields an empty list.

    Raises:
        KeyError: If a token is not present in ``genome_dict``.
    """
    # Direct indexing (not .get) so an unknown token fails loudly instead of
    # silently inserting a placeholder into the encoded sequence.
    return [genome_dict[token] for token in x.split()]