in backends/python/server/text_embeddings_server/models/flash_mistral.py [0:0]
def batch_type(self) -> Union[FlashBatch, PaddedBatch]:
    """Pick the batch type that matches the device this model runs on.

    Returns ``FlashBatch`` for every device whose ``self.device.type`` is
    not ``"hpu"``, and ``PaddedBatch`` for ``"hpu"``. The name itself is
    returned; nothing is instantiated here.

    NOTE(review): the return annotation lists the two batch types directly
    even though the body returns the types rather than instances -- confirm
    whether ``Type[...]`` was intended.
    """
    # HPU has no real variable-length forward pass yet, so it falls back to
    # padded batches; all other devices take the flash (varlen) path.
    if self.device.type != "hpu":
        return FlashBatch
    return PaddedBatch