in glide_text2im/tokenizer/bpe.py [0:0]
def get_encoder():
    """Build an ``Encoder`` from the gzipped data files stored beside this module.

    Two files are read from the directory containing this source file:

    * ``encoder.json.gz`` -- parsed as JSON and passed through as ``encoder``.
    * ``vocab.bpe.gz`` -- decoded as UTF-8 text; each retained line is split
      on whitespace into a tuple and the list of tuples is passed as
      ``bpe_merges``.

    Returns:
        The ``Encoder`` constructed from the loaded ``encoder`` and
        ``bpe_merges`` values.
    """
    module_dir = os.path.dirname(os.path.abspath(__file__))
    vocab_path = os.path.join(module_dir, "encoder.json.gz")
    merges_path = os.path.join(module_dir, "vocab.bpe.gz")

    with gzip.open(vocab_path, "r") as vocab_file:
        encoder = json.load(vocab_file)

    with gzip.open(merges_path, "r") as merges_file:
        merges_text = merges_file.read().decode("utf-8")

    # The first and last pieces of the newline split are discarded --
    # presumably a header line and the empty string left by a trailing
    # newline (NOTE(review): confirm against the bundled data file).
    merge_lines = merges_text.split("\n")[1:-1]
    bpe_merges = [tuple(line.split()) for line in merge_lines]

    return Encoder(encoder=encoder, bpe_merges=bpe_merges)