in submission_code/tools.py [0:0]
def __init__(self, config, pad_id):
    """Build the encoder-decoder model and store it on ``self.tr``.

    Two ``BertConfig`` objects are created from ``config`` (one for the
    encoder, one for the decoder), combined through
    ``EncoderDecoderConfig.from_encoder_decoder_configs`` and used to
    instantiate an ``EncoderDecoderModel``.

    Args:
        config: Object exposing ``src_vocab_size``, ``tgt_vocab_size``,
            ``h_size``, ``enc_layers``, ``dec_layers``, ``n_heads``,
            ``d_ff``, ``dropout`` and ``joined_vocab``.
        pad_id: Padding token id, passed as ``pad_token_id`` to both the
            encoder and the decoder configuration.
    """
    super(Transformer, self).__init__()

    # Settings that are identical for the encoder and the decoder stack.
    common_kwargs = dict(
        hidden_size=config.h_size,
        num_attention_heads=config.n_heads,
        intermediate_size=config.d_ff,
        hidden_dropout_prob=config.dropout,
        pad_token_id=pad_id,
    )

    enc_cfg = BertConfig(
        vocab_size=config.src_vocab_size,
        num_hidden_layers=config.enc_layers,
        **common_kwargs,
    )
    # The decoder additionally gets the decoder flag and cross-attention.
    dec_cfg = BertConfig(
        vocab_size=config.tgt_vocab_size,
        num_hidden_layers=config.dec_layers,
        is_decoder=True,
        add_cross_attention=True,
        **common_kwargs,
    )

    self.tr = EncoderDecoderModel(
        config=EncoderDecoderConfig.from_encoder_decoder_configs(enc_cfg, dec_cfg)
    )

    if config.joined_vocab:
        # Make the encoder use the very same word-embedding module object as
        # the decoder, so both sides share one embedding table.
        # NOTE(review): presumably this requires src_vocab_size ==
        # tgt_vocab_size -- confirm against the callers.
        tied_embeddings = self.tr.decoder.bert.embeddings.word_embeddings
        self.tr.encoder.embeddings.word_embeddings = tied_embeddings