Summary: 8 instances, 4 unique

| Text | Count |
| --- | --- |
| `pred_mask[0] = 0 # TODO: remove` | 2 |
| `encoder = TransformerModel(params, dico, is_encoder=True, with_output=True) # TODO: only output when necessary - len(params.clm_steps + params.mlm_steps) > 0` | 2 |
| `# TODO: add extra layer norm here?` | 2 |
| `if False: # AMP checkpoint reloading is buggy, we cannot do that - TODO: fix - https://github.com/NVIDIA/apex/issues/250` | 2 |