824 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (22:1026, 100%) - server/text_generation_server/layers/gptq/quantize.py (22:1026, 100%) 638 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (30:923, 100%) - server/text_generation_server/models/custom_modeling/bloom_modeling.py (30:923, 100%) 563 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (26:728, 84%) - server/text_generation_server/models/custom_modeling/idefics2.py (26:728, 84%) 458 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (8:817, 100%) - server/text_generation_server/models/custom_modeling/clip.py (8:817, 100%) 374 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (82:556, 51%) - server/text_generation_server/models/seq2seq_lm.py (84:558, 50%) 355 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (25:471, 77%) - server/text_generation_server/models/custom_modeling/idefics3.py (25:471, 77%) 287 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (9:410, 100%) - server/text_generation_server/models/custom_modeling/siglip.py (9:410, 100%) 283 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (347:693, 38%) - server/text_generation_server/models/custom_modeling/mllama.py (335:681, 34%) 225 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (646:920, 31%) - server/text_generation_server/models/seq2seq_lm.py (660:934, 30%) 214 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (51:381, 30%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (48:375, 29%) 207 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (112:373, 73%) - server/text_generation_server/cli.py (115:376, 72%) 204 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/mlp.py (11:282, 100%) - server/text_generation_server/layers/mlp.py (11:282, 100%) 201 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (36:269, 46%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (37:270, 46%) 193 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (12:238, 100%) - server/text_generation_server/models/custom_modeling/mamba_modeling.py (12:238, 100%) 190 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (32:265, 31%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (38:269, 30%) 186 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (176:484, 47%) - server/text_generation_server/utils/logits_process.py (175:483, 46%) 181 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (29:287, 21%) - server/text_generation_server/models/vlm_causal_lm.py (15:278, 19%) 180 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (326:540, 21%) - server/text_generation_server/models/vlm_causal_lm.py (318:535, 19%) 172 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (532:729, 24%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (566:762, 23%) 165 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/hub.py (12:234, 100%) - server/text_generation_server/utils/hub.py (12:234, 100%) 152 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (29:216, 80%) - server/text_generation_server/layers/moe/__init__.py (44:231, 70%) 147 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/merges/strategies.py (6:220, 100%) - server/text_generation_server/utils/merges/strategies.py (6:220, 100%) 147 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/tokens.py (272:441, 23%) - server/text_generation_server/utils/tokens.py (263:432, 28%) 144 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (163:306, 15%) - server/text_generation_server/models/__init__.py (217:360, 8%) 141 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (35:238, 19%) - server/text_generation_server/models/custom_modeling/mllama.py (40:240, 17%) 139 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/tokens.py (10:167, 22%) - server/text_generation_server/utils/tokens.py (8:164, 26%) 135 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (146:316, 47%) - server/text_generation_server/utils/weights.py (139:309, 48%) 132 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (21:253, 100%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (22:254, 100%) 132 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/medusa.py (7:191, 100%) - server/text_generation_server/layers/medusa.py (7:191, 100%) 127 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (51:213, 35%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (52:214, 34%) 124 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (35:182, 24%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (33:179, 24%) 121 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (345:496, 29%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (370:521, 27%) 118 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (768:916, 16%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (792:943, 16%) 116 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/adapter.py (132:279, 50%) - server/text_generation_server/utils/adapter.py (135:282, 48%) 115 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (42:190, 28%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (40:187, 27%) 113 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (192:322, 27%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (227:357, 25%) 110 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (283:408, 21%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (295:420, 21%) 109 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (34:168, 22%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (32:165, 23%) 107 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/quantization.py (8:140, 83%) - server/text_generation_server/utils/quantization.py (10:143, 65%) 106 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (34:165, 27%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (32:162, 27%) 105 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (47:158, 19%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (51:162, 19%) 105 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (60:171, 17%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (51:162, 18%) 99 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (383:488, 10%) - server/text_generation_server/models/__init__.py (521:626, 5%) 98 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (61:163, 16%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (52:154, 17%) 98 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (48:150, 18%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (52:154, 17%) 96 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/weights.py (13:146, 100%) - server/text_generation_server/adapters/weights.py (13:146, 100%) 95 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (24:136, 16%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (22:133, 16%) 93 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (249:365, 17%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (263:379, 16%) 92 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (158:276, 47%) - server/text_generation_server/models/custom_modeling/llava_next.py (158:276, 46%) 88 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/bnb.py (9:124, 100%) - server/text_generation_server/layers/bnb.py (9:124, 100%) 85 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/lora.py (147:279, 44%) - server/text_generation_server/layers/lora.py (153:285, 44%) 81 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (135:229, 12%) - server/text_generation_server/models/custom_modeling/idefics3.py (134:228, 17%) 81 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (390:496, 19%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (834:943, 11%) 81 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (810:916, 11%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (415:521, 18%) 81 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (134:228, 17%) - server/text_generation_server/models/custom_modeling/idefics2.py (135:229, 12%) 80 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (568:669, 13%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (602:703, 11%) 80 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/adapter.py (20:121, 34%) - server/text_generation_server/utils/adapter.py (20:121, 33%) 79 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/tensor_parallel.py (106:197, 44%) - server/text_generation_server/layers/tensor_parallel.py (113:204, 41%) 78 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (30:127, 21%) - server/text_generation_server/adapters/lora.py (32:129, 20%) 75 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (499:603, 12%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (527:631, 12%) 75 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (173:255, 14%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (182:264, 13%) 75 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (173:255, 14%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (182:264, 13%) 74 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/convert.py (12:114, 100%) - server/text_generation_server/utils/convert.py (12:114, 100%) 73 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/hpu.py (100:180, 45%) - server/text_generation_server/layers/gptq/ipex.py (43:123, 68%) 72 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (157:237, 20%) - server/text_generation_server/layers/gptq/__init__.py (193:273, 18%) 71 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/tokens.py (597:697, 11%) - server/text_generation_server/utils/tokens.py (545:645, 13%) 69 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (125:198, 13%) - server/text_generation_server/layers/rotary.py (124:197, 14%) 68 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (24:101, 74%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (24:101, 72%) 68 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (186:260, 11%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (182:256, 12%) 68 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (186:260, 11%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (182:256, 12%) 67 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/tokens.py (172:256, 10%) - server/text_generation_server/utils/tokens.py (165:249, 12%) 67 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (110:186, 12%) - server/text_generation_server/models/mllama_causal_lm.py (88:164, 21%) 66 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (738:815, 8%) - server/text_generation_server/models/custom_modeling/mllama.py (765:842, 8%) 66 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (252:332, 8%) - server/text_generation_server/models/custom_modeling/mllama.py (244:325, 8%) 65 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (15:93, 18%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (13:90, 18%) 63 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (64:135, 11%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (72:143, 11%) 62 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (453:532, 10%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (414:493, 11%) 60 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (259:331, 11%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (269:341, 10%) 60 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (259:331, 11%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (269:341, 10%) 59 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (623:698, 7%) - server/text_generation_server/models/vlm_causal_lm.py (616:691, 6%) 59 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (396:472, 11%) - server/text_generation_server/layers/rotary.py (397:473, 12%) 58 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (270:336, 9%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (322:388, 8%) 58 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (64:131, 8%) - server/text_generation_server/models/custom_modeling/idefics3.py (63:130, 12%) 58 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (146:207, 9%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (148:209, 8%) 58 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (411:486, 9%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (420:495, 9%) 58 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (291:357, 12%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (291:357, 12%) 58 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (63:130, 12%) - server/text_generation_server/models/custom_modeling/idefics2.py (64:131, 8%) 57 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/tensor_parallel.py (9:90, 31%) - server/text_generation_server/layers/tensor_parallel.py (11:92, 30%) 57 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (489:560, 11%) - server/text_generation_server/layers/rotary.py (490:561, 11%) 56 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (957:1024, 5%) - server/text_generation_server/models/__init__.py (1810:1877, 3%) 54 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (386:456, 10%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (414:484, 9%) 54 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (227:289, 13%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (245:307, 12%) 54 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (254:318, 15%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (258:322, 14%) 54 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (502:565, 10%) - server/text_generation_server/layers/fp8.py (378:441, 12%) 53 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (10:68, 100%) - server/text_generation_server/utils/peft.py (10:68, 100%) 53 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (314:374, 12%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (318:378, 12%) 53 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/watermark.py (38:98, 80%) - server/text_generation_server/utils/watermark.py (38:98, 80%) 53 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (356:415, 14%) - server/text_generation_server/adapters/lora.py (373:432, 14%) 52 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (340:411, 2%) - server/text_generation_server/models/flash_causal_lm.py (320:391, 2%) 52 duplicated lines in: - backends/gaudi/server/text_generation_server/models/types.py (13:75, 69%) - server/text_generation_server/models/types.py (13:75, 63%) 52 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/loader.py (9:84, 49%) - server/text_generation_server/layers/compressed_tensors/loader.py (18:89, 40%) 52 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (122:178, 12%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (130:186, 11%) 51 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (55:121, 8%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (55:121, 7%) 51 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (75:166, 13%) - server/text_generation_server/utils/logits_process.py (78:169, 12%) 51 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (299:353, 10%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (330:384, 7%) 51 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (278:332, 8%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (299:353, 10%) 50 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (339:406, 17%) - server/text_generation_server/utils/weights.py (329:396, 17%) 50 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1399:1459, 2%) - server/text_generation_server/models/flash_causal_lm.py (1232:1292, 2%) 49 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (326:383, 9%) - server/text_generation_server/layers/fp8.py (263:320, 11%) 49 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (419:476, 11%) - server/text_generation_server/models/transformers_flash_vlm.py (430:490, 10%) 49 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (52:104, 12%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (51:103, 10%) 49 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (839:896, 6%) - server/text_generation_server/models/transformers_flash_vlm.py (430:490, 10%) 49 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (54:106, 10%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (49:101, 12%) 48 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (52:106, 11%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (57:111, 10%) 48 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (591:647, 8%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (612:668, 8%) 48 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (417:471, 13%) - server/text_generation_server/adapters/lora.py (434:488, 12%) 48 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (473:527, 6%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (505:559, 6%) 48 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (134:206, 13%) - server/text_generation_server/adapters/lora.py (138:210, 12%) 47 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (35:101, 14%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (33:98, 14%) 47 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (563:621, 5%) - server/text_generation_server/models/vlm_causal_lm.py (554:612, 5%) 47 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/exl2.py (8:78, 100%) - server/text_generation_server/layers/exl2.py (8:78, 100%) 47 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (189:240, 9%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (185:236, 10%) 46 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (385:438, 12%) - server/text_generation_server/layers/gptq/__init__.py (383:436, 12%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (83:139, 42%) - server/text_generation_server/layers/moe/unquantized.py (107:163, 23%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (108:162, 11%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (63:117, 6%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (108:162, 11%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (107:161, 9%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (110:164, 9%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (63:117, 6%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (63:117, 7%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (107:161, 9%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (110:164, 9%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (105:159, 11%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (912:957, 2%) - server/text_generation_server/models/flash_causal_lm.py (899:944, 2%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (7:81, 6%) - server/text_generation_server/models/seq2seq_lm.py (7:82, 6%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (465:522, 7%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (477:534, 7%) 45 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (63:117, 7%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (105:159, 11%) 44 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (172:220, 10%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (220:268, 10%) 44 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (855:909, 2%) - server/text_generation_server/models/flash_causal_lm.py (842:896, 2%) 44 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/tokens.py (452:506, 7%) - server/text_generation_server/utils/tokens.py (429:483, 8%) 44 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/merges/utils.py (23:108, 100%) - server/text_generation_server/utils/merges/utils.py (23:108, 100%) 44 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/awq/conversion_utils.py (5:97, 100%) - server/text_generation_server/layers/awq/conversion_utils.py (5:97, 100%) 43 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2432:2477, 2%) - server/text_generation_server/models/flash_causal_lm.py (2333:2378, 2%) 43 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (844:891, 5%) - server/text_generation_server/models/causal_lm.py (814:861, 6%) 43 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (384:433, 7%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (417:466, 7%) 43 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (152:201, 7%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (163:212, 7%) 43 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (305:356, 8%) - server/text_generation_server/layers/rotary.py (309:360, 8%) 42 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (28:110, 21%) - server/text_generation_server/models/custom_modeling/llava_next.py (28:110, 21%) 42 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (112:162, 10%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (156:206, 9%) 42 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (326:376, 9%) - server/text_generation_server/models/custom_modeling/idefics2.py (327:377, 6%) 42 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (272:321, 10%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (699:749, 5%) 42 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (327:377, 6%) - server/text_generation_server/models/custom_modeling/idefics3.py (326:376, 9%) 42 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (665:716, 5%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (307:356, 9%) 42 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (734:782, 6%) - server/text_generation_server/models/custom_modeling/idefics2.py (733:781, 6%) 42 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (207:250, 8%) - server/text_generation_server/layers/rotary.py (205:248, 8%) 41 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (477:523, 8%) - server/text_generation_server/models/custom_modeling/idefics3.py (476:522, 8%) 41 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1345:1392, 1%) - server/text_generation_server/models/flash_causal_lm.py (1170:1217, 2%) 41 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (276:323, 10%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (327:374, 9%) 41 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (142:187, 9%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (175:220, 9%) 41 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/hpu.py (105:148, 25%) - server/text_generation_server/layers/gptq/triton.py (273:316, 13%) 41 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (387:436, 9%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (393:442, 9%) 41 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (877:921, 5%) - server/text_generation_server/models/custom_modeling/mllama.py (907:951, 5%) 41 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (152:238, 1%) - server/text_generation_server/models/flash_causal_lm.py (122:208, 2%) 41 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (12:56, 38%) - server/text_generation_server/layers/moe/unquantized.py (18:62, 21%) 40 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (431:472, 1%) - server/text_generation_server/models/flash_causal_lm.py (428:469, 2%) 40 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (246:287, 1%) - server/text_generation_server/models/flash_causal_lm.py (210:251, 2%) 40 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (282:342, 9%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (294:354, 9%) 40 duplicated lines in: - backends/gaudi/server/text_generation_server/models/model.py (16:64, 40%) - server/text_generation_server/models/model.py (23:71, 30%) 39 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (440:482, 9%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (463:505, 8%) 39 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (860:903, 4%) - server/text_generation_server/models/vlm_causal_lm.py (875:918, 4%) 38 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (334:382, 10%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (340:388, 10%) 38 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/speculative.py (9:52, 100%) - server/text_generation_server/layers/speculative.py (9:52, 100%) 37 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (252:295, 9%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (259:302, 9%) 37 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (286:326, 10%) - server/text_generation_server/adapters/lora.py (302:342, 9%) 37 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (528:582, 9%) - server/text_generation_server/utils/logits_process.py (542:596, 9%) 36 duplicated lines in: - backends/gaudi/server/text_generation_server/tracing.py (6:63, 100%) - server/text_generation_server/tracing.py (6:63, 100%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (542:579, 5%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (502:539, 6%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (114:154, 18%) - server/text_generation_server/models/custom_modeling/llava_next.py (114:154, 17%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (203:240, 7%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (150:186, 7%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (142:178, 8%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (199:236, 7%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (194:234, 6%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:236, 6%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (671:709, 5%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (766:804, 4%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (466:503, 6%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (493:530, 6%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (247:284, 8%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (340:377, 4%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (279:319, 6%) - server/text_generation_server/layers/fp8.py (219:259, 7%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (247:284, 8%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (309:346, 7%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (309:346, 7%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (265:302, 7%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (182:222, 15%) - server/text_generation_server/layers/moe/fp8.py (109:149, 24%) 35 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (288:325, 5%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (265:302, 7%) 34 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (829:873, 4%) - server/text_generation_server/models/custom_modeling/mllama.py (859:903, 4%) 34 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/vlm.py (20:67, 72%) - server/text_generation_server/models/custom_modeling/vlm.py (20:69, 72%) 34 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (518:558, 7%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (498:538, 7%) 34 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/loader.py (90:148, 32%) - server/text_generation_server/layers/compressed_tensors/loader.py (91:149, 26%) 34 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (551:591, 6%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (554:594, 6%) 34 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (241:277, 9%) - server/text_generation_server/layers/gptq/__init__.py (284:320, 8%) 33 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (224:263, 8%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (273:312, 7%) 33 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (239:284, 9%) - server/text_generation_server/adapters/lora.py (255:300, 8%) 33 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (509:550, 5%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (540:581, 4%) 33 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (700:734, 1%) - server/text_generation_server/models/flash_causal_lm.py (704:738, 1%) 32 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (426:464, 8%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (417:455, 8%) 32 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (174:211, 6%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (177:214, 9%) 32 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (487:523, 7%) - server/text_generation_server/models/custom_modeling/idefics2.py (744:781, 4%) 32 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (257:296, 5%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (265:304, 5%) 32 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (147:182, 5%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (148:183, 5%) 32 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (160:193, 9%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (266:299, 8%) 32 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (745:782, 4%) - server/text_generation_server/models/custom_modeling/idefics3.py (486:522, 6%) 32 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:192, 9%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (335:368, 7%) 32 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1935:1975, 1%) - server/text_generation_server/models/flash_causal_lm.py (1724:1764, 1%) 31 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (110:146, 15%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (98:134, 21%) 31 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (259:291, 7%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (336:368, 7%) 31 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (216:256, 8%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (221:261, 9%) 31 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (285:317, 7%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (266:298, 8%) 31 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/conv.py (5:41, 100%) - server/text_generation_server/layers/conv.py (5:41, 100%) 31 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (54:99, 11%) - server/text_generation_server/cli.py (62:107, 10%) 31 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (67:100, 15%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (61:94, 21%) 30 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (637:666, 1%) - server/text_generation_server/models/flash_causal_lm.py (648:677, 1%) 30 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (204:241, 9%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (222:259, 9%) 30 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1191:1228, 1%) - server/text_generation_server/models/flash_causal_lm.py (1065:1102, 1%) 30 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (344:385, 5%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (356:397, 5%) 30 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (376:407, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (368:399, 6%) 30 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (357:388, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (399:430, 4%) 30 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/lora.py (111:143, 15%) - server/text_generation_server/layers/lora.py (117:149, 15%) 30 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (188:220, 5%) - server/text_generation_server/models/mllama_causal_lm.py (166:198, 9%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (905:939, 3%) - server/text_generation_server/models/vlm_causal_lm.py (920:954, 3%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (276:308, 4%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (284:316, 4%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (202:234, 7%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:236, 6%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (1025:1060, 3%) - server/text_generation_server/models/__init__.py (1881:1916, 1%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (72:105, 9%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:236, 6%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (72:105, 9%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (176:208, 7%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (454:488, 7%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (493:527, 6%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (172:204, 7%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (176:208, 7%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (162:192, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (198:228, 6%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (202:232, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (164:194, 4%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (202:234, 7%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (176:208, 7%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (172:204, 7%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:236, 6%) 29 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (54:88, 8%) - server/text_generation_server/layers/gptq/__init__.py (72:106, 7%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (142:170, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (165:194, 3%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (806:840, 4%) - server/text_generation_server/models/custom_modeling/idefics2.py (791:825, 4%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (20:49, 12%) - server/text_generation_server/layers/moe/fp8.py (20:49, 19%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (561:590, 3%) - server/text_generation_server/models/seq2seq_lm.py (573:602, 3%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/model.py (104:142, 28%) - server/text_generation_server/models/model.py (144:181, 21%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (192:226, 8%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (199:233, 8%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (312:345, 4%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (321:354, 4%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (163:192, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (150:178, 6%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:159, 7%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:161, 8%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (195:224, 11%) - server/text_generation_server/server.py (223:252, 11%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (163:203, 7%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:206, 8%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (121:153, 7%) - server/text_generation_server/layers/gptq/__init__.py (151:183, 7%) 28 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (114:146, 8%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:155, 8%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/tensor_parallel.py (202:238, 15%) - server/text_generation_server/layers/tensor_parallel.py (208:244, 14%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (21:49, 11%) - server/text_generation_server/layers/moe/unquantized.py (19:47, 14%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (548:583, 5%) - server/text_generation_server/models/custom_modeling/idefics3.py (532:567, 5%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (159:191, 8%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (175:207, 8%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (217:247, 14%) - server/text_generation_server/layers/moe/__init__.py (240:270, 12%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (212:246, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (216:251, 3%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (361:394, 5%) - server/text_generation_server/layers/rotary.py (362:395, 5%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/adapter.py (281:320, 11%) - server/text_generation_server/utils/adapter.py (290:329, 11%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (13:41, 25%) - server/text_generation_server/layers/moe/fp8.py (21:49, 18%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (941:970, 3%) - server/text_generation_server/models/vlm_causal_lm.py (956:985, 2%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (395:424, 7%) - server/text_generation_server/layers/gptq/__init__.py (157:186, 7%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (482:511, 5%) - server/text_generation_server/models/vlm_causal_lm.py (956:985, 2%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (482:511, 5%) - server/text_generation_server/models/mllama_causal_lm.py (212:241, 8%) 27 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (941:970, 3%) - server/text_generation_server/models/mllama_causal_lm.py (212:241, 8%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/mlp.py (179:210, 12%) - server/text_generation_server/layers/mlp.py (83:114, 12%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (329:354, 7%) - server/text_generation_server/adapters/lora.py (347:372, 6%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/mlp.py (83:114, 12%) - server/text_generation_server/layers/mlp.py (179:210, 12%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (288:320, 1%) - server/text_generation_server/models/flash_causal_lm.py (254:286, 1%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (344:376, 4%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (355:387, 4%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:236, 4%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (218:248, 4%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (384:412, 3%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (400:428, 3%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (183:213, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (242:272, 5%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (109:139, 8%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (213:243, 6%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (531:566, 1%) - server/text_generation_server/models/flash_causal_lm.py (528:563, 1%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1105:1134, 1%) - server/text_generation_server/models/flash_causal_lm.py (994:1023, 1%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (238:268, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (213:243, 6%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (54:81, 6%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (71:98, 5%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (239:269, 5%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (242:272, 5%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (208:238, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (213:243, 6%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (245:275, 5%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (242:272, 5%) 26 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (848:874, 3%) - server/text_generation_server/models/flash_causal_lm.py (2353:2379, 1%) 25 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (10:53, 12%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (11:55, 17%) 25 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2452:2477, 1%) - server/text_generation_server/models/seq2seq_lm.py (862:887, 3%) 25 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/utils.py (5:56, 100%) - server/text_generation_server/layers/gptq/utils.py (5:56, 100%) 25 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (421:452, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (366:397, 4%) 25 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2452:2477, 1%) - server/text_generation_server/models/causal_lm.py (818:843, 3%) 25 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (51:85, 7%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (46:79, 7%) 25 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (411:441, 7%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (411:441, 6%) 25 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (23:54, 8%) - server/text_generation_server/cli.py (31:59, 8%) 25 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (592:619, 3%) - server/text_generation_server/models/seq2seq_lm.py (604:631, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (506:533, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (452:478, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (240:268, 5%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (244:272, 5%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (185:213, 5%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (326:354, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (247:275, 5%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (215:243, 6%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (111:139, 7%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (244:272, 5%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (247:275, 5%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (326:354, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (718:744, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (818:890, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (241:269, 4%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (326:354, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (210:238, 6%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (326:354, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (355:385, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (367:397, 4%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (241:269, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (215:243, 6%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (443:469, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (534:561, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (210:238, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (244:272, 5%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (401:427, 4%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (410:436, 4%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (351:379, 6%) - server/text_generation_server/layers/gptq/__init__.py (336:364, 6%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (317:345, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (244:272, 5%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (148:179, 7%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (153:184, 7%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (317:345, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (215:243, 6%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (185:213, 5%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (215:243, 6%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (240:268, 5%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (326:354, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (127:153, 6%) - server/text_generation_server/layers/gptq/__init__.py (393:419, 6%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (99:139, 8%) - server/text_generation_server/utils/weights.py (96:136, 8%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (111:139, 7%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (326:354, 3%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (422:452, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (367:397, 4%) 24 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (17:44, 6%) - server/text_generation_server/utils/logits_process.py (16:43, 5%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (162:185, 7%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:406, 3%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (462:490, 4%) - server/text_generation_server/layers/fp8.py (343:371, 5%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:233, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (242:269, 4%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (245:272, 4%) - server/text_generation_server/layers/fp8.py (187:214, 5%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (411:455, 8%) - server/text_generation_server/utils/weights.py (398:442, 8%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (484:511, 5%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (488:515, 5%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (287:310, 5%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:406, 3%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (84:108, 4%) - server/text_generation_server/models/mllama_causal_lm.py (63:87, 7%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (120:144, 6%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (124:148, 7%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/types.py (78:102, 30%) - server/text_generation_server/models/types.py (86:110, 28%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/dist.py (13:42, 52%) - server/text_generation_server/utils/dist.py (16:45, 31%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (596:619, 3%) - server/text_generation_server/models/causal_lm.py (571:594, 3%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (113:144, 2%) - server/text_generation_server/models/__init__.py (154:185, 1%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:406, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (268:291, 6%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (261:284, 5%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:406, 3%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (239:266, 4%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (218:245, 4%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (183:210, 5%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (218:245, 4%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (352:377, 5%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (361:386, 5%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (245:272, 4%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (218:245, 4%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (544:570, 2%) - server/text_generation_server/layers/gptq/quantize.py (446:472, 2%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (186:218, 4%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (188:220, 4%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:406, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (338:361, 5%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (300:331, 4%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (309:340, 4%) 23 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (446:472, 2%) - server/text_generation_server/layers/gptq/quantize.py (544:570, 2%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (483:507, 4%) - server/text_generation_server/models/flash_causal_lm.py (1728:1752, 1%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (138:160, 9%) - server/text_generation_server/server.py (145:167, 8%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/linear.py (5:28, 84%) - server/text_generation_server/layers/linear.py (21:44, 22%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1939:1963, 1%) - server/text_generation_server/models/vlm_causal_lm.py (957:981, 2%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (418:442, 4%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (426:450, 4%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1939:1963, 1%) - server/text_generation_server/models/mllama_causal_lm.py (213:237, 6%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (388:412, 3%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (75:98, 5%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (341:363, 4%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (198:220, 5%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/attention/kv_cache.py (10:49, 16%) - server/text_generation_server/layers/attention/kv_cache.py (27:66, 8%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (942:966, 2%) - server/text_generation_server/models/flash_causal_lm.py (1728:1752, 1%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (586:610, 5%) - server/text_generation_server/utils/logits_process.py (601:625, 5%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (82:105, 7%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (140:163, 6%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (58:81, 5%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (404:428, 3%) 22 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/tokens.py (561:595, 3%) - server/text_generation_server/utils/tokens.py (509:543, 4%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (389:415, 5%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (377:403, 6%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (210:235, 5%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (220:245, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (60:82, 4%) - server/text_generation_server/models/mllama_causal_lm.py (39:61, 6%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (425:453, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (462:490, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (208:233, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (326:351, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (110:132, 2%) - server/text_generation_server/models/mamba.py (145:166, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (557:579, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (508:530, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (494:518, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (521:545, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (317:342, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (220:245, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (712:733, 2%) - server/text_generation_server/models/vlm_causal_lm.py (707:728, 2%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (208:233, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (215:240, 5%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (240:265, 5%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (220:245, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (110:132, 2%) - server/text_generation_server/models/causal_lm.py (106:127, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (815:840, 3%) - server/text_generation_server/models/custom_modeling/idefics3.py (540:567, 4%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (556:583, 4%) - server/text_generation_server/models/custom_modeling/idefics2.py (800:825, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (362:386, 6%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (368:392, 6%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (273:301, 4%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (275:303, 4%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (111:136, 6%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (220:245, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (217:241, 5%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (219:243, 5%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (110:132, 2%) - server/text_generation_server/models/galactica.py (90:111, 21%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (720:746, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (736:762, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/cache.py (7:34, 100%) - server/text_generation_server/cache.py (7:34, 100%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (481:503, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (517:539, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2313:2336, 1%) - server/text_generation_server/models/flash_causal_lm.py (1906:1929, 1%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (501:529, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (453:481, 3%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (773:800, 1%) - server/text_generation_server/models/flash_causal_lm.py (775:802, 1%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (477:505, 1%) - server/text_generation_server/models/flash_causal_lm.py (470:498, 1%) 21 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/lora.py (17:42, 11%) - server/text_generation_server/layers/lora.py (19:44, 10%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1385:1409, 1%) - server/text_generation_server/models/transformers_flash_vlm.py (601:623, 4%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (579:599, 3%) - server/text_generation_server/layers/fp8.py (467:487, 4%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/__init__.py (26:46, 48%) - server/text_generation_server/utils/__init__.py (21:41, 57%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (350:371, 4%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (799:820, 2%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/segments.py (32:66, 55%) - server/text_generation_server/utils/segments.py (28:62, 60%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (102:121, 3%) - server/text_generation_server/layers/rotary.py (101:120, 4%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (306:327, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (341:362, 4%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (775:796, 2%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (375:396, 4%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (95:119, 5%) - server/text_generation_server/layers/gptq/__init__.py (108:132, 5%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (467:492, 4%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (466:491, 4%) 20 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (299:320, 5%) - server/text_generation_server/layers/gptq/__init__.py (284:305, 5%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (605:628, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (622:645, 3%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (264:287, 4%) - server/text_generation_server/models/custom_modeling/idefics2.py (265:288, 2%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (392:417, 5%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (385:410, 5%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/tokens.py (508:526, 3%) - server/text_generation_server/utils/tokens.py (484:502, 3%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (522:540, 2%) - server/text_generation_server/models/__init__.py (696:714, 1%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (681:704, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (631:654, 3%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (321:342, 5%) - server/text_generation_server/layers/gptq/__init__.py (307:328, 5%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (328:353, 5%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (382:407, 4%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (334:355, 5%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (327:348, 5%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/__init__.py (2:30, 76%) - server/text_generation_server/layers/__init__.py (2:29, 79%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (265:288, 2%) - server/text_generation_server/models/custom_modeling/idefics3.py (264:287, 4%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (502:520, 2%) - server/text_generation_server/models/__init__.py (662:680, 1%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/layernorm.py (7:31, 45%) - server/text_generation_server/layers/layernorm.py (10:34, 12%) 19 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/attention/kv_cache.py (68:97, 14%) - server/text_generation_server/layers/attention/kv_cache.py (154:182, 7%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (76:96, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (80:100, 4%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (214:234, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (112:130, 4%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (18:38, 5%) - server/text_generation_server/layers/gptq/__init__.py (22:42, 4%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (737:755, <1%) - server/text_generation_server/models/flash_causal_lm.py (738:756, <1%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (307:328, 5%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (317:338, 5%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (431:450, 4%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (437:456, 4%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (207:233, 4%) - server/text_generation_server/adapters/lora.py (219:245, 4%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (300:325, 5%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (307:332, 5%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (304:323, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (307:326, 4%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (453:478, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (488:513, 3%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (75:95, 4%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (73:93, 4%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2401:2420, <1%) - server/text_generation_server/models/flash_causal_lm.py (2304:2323, <1%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (11:65, 6%) - server/text_generation_server/utils/weights.py (13:67, 6%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (973:991, 2%) - server/text_generation_server/models/vlm_causal_lm.py (991:1009, 1%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (233:254, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (290:312, 4%) 18 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/hpu.py (34:52, 11%) - server/text_generation_server/layers/gptq/ipex.py (9:27, 16%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (378:399, 3%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (388:409, 2%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (13:29, 16%) - server/text_generation_server/layers/moe/__init__.py (204:220, 7%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1978:1995, <1%) - server/text_generation_server/models/mllama_causal_lm.py (247:264, 5%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (496:515, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (501:520, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (280:299, 6%) - server/text_generation_server/server.py (290:309, 6%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (298:316, 2%) - server/text_generation_server/models/custom_modeling/idefics3.py (297:315, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (141:162, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (120:141, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (871:891, 2%) - server/text_generation_server/models/idefics_causal_lm.py (846:866, 2%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (339:358, 5%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (337:356, 5%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (244:261, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (277:294, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (196:213, 4%) - server/text_generation_server/layers/gptq/__init__.py (301:318, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/awq/quantize/hpu.py (93:114, 17%) - server/text_generation_server/layers/awq/quantize/ipex.py (7:28, 48%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (514:531, 3%) - server/text_generation_server/models/mllama_causal_lm.py (247:264, 5%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1142:1163, <1%) - server/text_generation_server/models/flash_causal_lm.py (1029:1050, <1%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (359:377, 4%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (263:280, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (181:200, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (112:129, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (662:685, 3%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (664:687, 2%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (297:315, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (298:316, 2%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (275:294, 5%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (411:430, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (214:233, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (192:211, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (258:275, 4%) - server/text_generation_server/layers/gptq/__init__.py (232:249, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (189:205, 8%) - server/text_generation_server/layers/moe/unquantized.py (19:35, 8%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (71:92, 6%) - server/text_generation_server/server.py (79:100, 6%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (386:405, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (411:430, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (386:405, 4%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (329:348, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (203:220, 4%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (578:595, 2%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (579:598, 3%) - server/text_generation_server/layers/rotary.py (574:593, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1978:1995, <1%) - server/text_generation_server/models/flash_causal_lm.py (1770:1787, <1%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/awq/quantize/hpu.py (93:114, 17%) - server/text_generation_server/layers/awq/quantize/cuda.py (19:40, 68%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (361:379, 3%) - server/text_generation_server/layers/rotary.py (309:328, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (309:327, 4%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (368:386, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (181:200, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (216:235, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (189:205, 8%) - server/text_generation_server/layers/moe/fp8.py (21:37, 11%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (359:377, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (344:362, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (244:261, 4%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (347:364, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (123:144, 4%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (166:187, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (114:132, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (25:43, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (275:294, 5%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (329:348, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (544:561, 2%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (238:255, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (279:297, 3%) - server/text_generation_server/layers/fp8.py (378:396, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (305:324, 3%) - server/text_generation_server/layers/rotary.py (362:380, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (532:552, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (557:577, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (21:37, 7%) - server/text_generation_server/layers/moe/__init__.py (204:220, 7%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (141:162, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (166:187, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (514:531, 3%) - server/text_generation_server/models/flash_causal_lm.py (1770:1787, <1%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (122:143, 4%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (120:141, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (401:420, 4%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (444:463, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (309:327, 4%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (263:280, 4%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (502:520, 3%) - server/text_generation_server/layers/fp8.py (219:237, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (122:143, 4%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (138:159, 3%) 17 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (123:144, 4%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (138:159, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (14:36, 3%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (12:33, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (690:706, 2%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (1137:1155, 1%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (753:768, 1%) - server/text_generation_server/models/__init__.py (1309:1324, <1%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (261:277, 4%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (325:341, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (753:768, 1%) - server/text_generation_server/models/__init__.py (1290:1305, <1%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (188:204, 5%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:386, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (23:52, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (23:54, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (630:647, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (585:602, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (207:223, 4%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (264:280, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (670:687, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (690:707, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (188:204, 5%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (264:280, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (554:571, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (585:602, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (452:469, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (484:501, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (128:145, 4%) - server/text_generation_server/layers/gptq/__init__.py (290:307, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (65:81, 3%) - server/text_generation_server/models/custom_modeling/siglip.py (25:40, 5%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (610:628, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (617:635, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (376:392, 4%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:386, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (630:647, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (576:593, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (326:341, 1%) - server/text_generation_server/models/__init__.py (390:405, <1%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (188:204, 5%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (346:362, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (378:394, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (235:251, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2480:2499, <1%) - server/text_generation_server/models/flash_causal_lm.py (2381:2400, <1%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (247:264, 4%) - server/text_generation_server/layers/gptq/__init__.py (158:175, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (207:223, 4%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:386, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (690:706, 2%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (578:596, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (255:272, 5%) - server/text_generation_server/cli.py (208:225, 5%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (247:264, 4%) - server/text_generation_server/layers/gptq/__init__.py (394:411, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (554:571, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (576:593, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (376:392, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (346:362, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (332:349, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (380:397, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (194:212, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (91:110, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (25:40, 5%) - server/text_generation_server/models/custom_modeling/idefics2.py (66:82, 2%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (265:281, 4%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (267:283, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (31:46, 8%) - server/text_generation_server/layers/moe/__init__.py (77:92, 7%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (321:337, 3%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (265:281, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (396:413, 4%) - server/text_generation_server/layers/gptq/__init__.py (290:307, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (376:392, 4%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (264:280, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (511:530, <1%) - server/text_generation_server/models/flash_causal_lm.py (507:526, <1%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (25:40, 5%) - server/text_generation_server/models/custom_modeling/idefics3.py (65:81, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (66:82, 2%) - server/text_generation_server/models/custom_modeling/siglip.py (25:40, 5%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (207:223, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (346:362, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (62:77, 8%) - server/text_generation_server/layers/moe/__init__.py (46:61, 7%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (374:391, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (371:388, 4%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (464:481, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (450:467, 3%) 16 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (205:222, 5%) - server/text_generation_server/cli.py (258:275, 5%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (662:678, 2%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (59:74, 15%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (200:218, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:243, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (235:250, 3%) - server/text_generation_server/models/custom_modeling/siglip.py (164:179, 5%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (461:482, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (473:494, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (200:218, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (254:272, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (96:115, 4%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (93:112, 4%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (277:296, 4%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (283:302, 4%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (164:179, 5%) - server/text_generation_server/models/custom_modeling/clip.py (235:250, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (870:886, 2%) - server/text_generation_server/models/mamba.py (782:798, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (566:590, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (579:603, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (232:247, 3%) - server/text_generation_server/models/custom_modeling/clip.py (235:250, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (394:415, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (407:428, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (173:191, 4%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (294:312, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (251:269, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (202:220, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (250:268, 3%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (202:220, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (235:250, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (233:248, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (327:345, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (202:220, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (41:60, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (40:59, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (424:444, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (683:700, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (232:247, 3%) - server/text_generation_server/models/custom_modeling/siglip.py (164:179, 5%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/model.py (66:83, 15%) - server/text_generation_server/models/model.py (97:114, 11%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (366:386, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (416:436, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (164:179, 5%) - server/text_generation_server/models/custom_modeling/idefics3.py (232:247, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (232:247, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (233:248, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (233:248, 2%) - server/text_generation_server/models/custom_modeling/clip.py (235:250, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (683:700, 2%) - server/text_generation_server/models/custom_modeling/idefics3.py (424:444, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (32:52, 2%) - server/text_generation_server/models/custom_modeling/neox_modeling.py (30:50, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (195:213, 3%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (202:220, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (245:263, 3%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (189:207, 4%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (121:139, 4%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (202:220, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (233:248, 2%) - server/text_generation_server/models/custom_modeling/idefics3.py (232:247, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (25:44, 4%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (66:85, 4%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (237:254, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (189:207, 4%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (164:179, 5%) - server/text_generation_server/models/custom_modeling/idefics2.py (233:248, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1506:1521, <1%) - server/text_generation_server/models/flash_causal_lm.py (1330:1345, <1%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (257:275, 3%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (202:220, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (233:248, 2%) - server/text_generation_server/models/custom_modeling/siglip.py (164:179, 5%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (235:250, 3%) - server/text_generation_server/models/custom_modeling/idefics3.py (232:247, 3%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (200:218, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (336:354, 2%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (146:160, 6%) - server/text_generation_server/server.py (118:132, 6%) 15 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (220:238, 3%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (202:220, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (46:68, 5%) - server/text_generation_server/server.py (56:76, 5%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (352:367, 4%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (501:515, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (164:178, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:236, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (407:427, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (453:473, 1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (444:461, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (455:472, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (91:105, 4%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:316, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (244:258, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (393:406, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (164:178, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (116:130, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (576:591, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (491:505, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (294:308, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (222:236, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (225:240, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:236, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/chunks.py (8:27, 100%) - server/text_generation_server/utils/chunks.py (8:27, 100%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (315:331, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (191:207, 4%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (473:486, 2%) - server/text_generation_server/layers/rotary.py (475:488, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (468:482, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (501:515, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (294:307, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (254:267, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (84:100, 3%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (430:446, 1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (247:263, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (325:341, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (426:446, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (420:440, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (225:241, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (325:341, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (225:240, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (116:130, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (225:241, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (296:312, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (352:367, 4%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (579:594, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (39:57, 4%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (52:70, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (497:511, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (491:505, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (305:320, 3%) - server/text_generation_server/layers/gptq/__init__.py (394:409, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (305:320, 3%) - server/text_generation_server/layers/gptq/__init__.py (158:173, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (25:49, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (26:50, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (190:204, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:316, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (296:310, 3%) - server/text_generation_server/models/custom_modeling/mllama.py (778:791, 1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (751:764, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (393:406, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (752:765, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (453:466, 1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (26:50, 2%) - server/text_generation_server/models/custom_modeling/idefics3.py (25:49, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (247:263, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (325:341, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (497:511, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (579:594, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (239:254, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (227:243, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (219:234, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (172:186, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (690:703, 2%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (721:734, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/config.py (14:30, 100%) - server/text_generation_server/adapters/config.py (14:30, 100%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (33:51, 3%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (31:48, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (415:431, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (100:116, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (220:234, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:316, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (270:284, 3%) - server/text_generation_server/models/custom_modeling/mllama.py (778:791, 1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (297:315, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (301:319, 4%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (239:254, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (325:341, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (219:234, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (221:236, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/prefill_chunking.py (3:24, 100%) - server/text_generation_server/utils/prefill_chunking.py (3:24, 100%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (468:482, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (579:594, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (415:431, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (430:446, 1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (175:191, 4%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (227:243, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (188:203, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (232:248, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (220:236, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:206, 4%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (171:185, 4%) - server/text_generation_server/models/custom_modeling/mllama.py (778:791, 1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (225:241, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (325:341, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (175:191, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (325:341, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (247:263, 3%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (227:243, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (751:764, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (347:361, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (757:771, <1%) - server/text_generation_server/models/flash_causal_lm.py (757:771, <1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (576:591, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (501:515, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (122:136, 4%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (239:253, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (380:394, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (387:401, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (586:600, 1%) - server/text_generation_server/models/__init__.py (885:899, <1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (352:367, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (491:505, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (315:331, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (296:312, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (236:249, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (308:321, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (225:241, 3%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (191:207, 4%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (175:191, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (325:341, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (244:258, 3%) - server/text_generation_server/models/custom_modeling/mllama.py (778:791, 1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (751:764, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (277:291, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (315:331, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (227:243, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/__init__.py (8:22, 34%) - server/text_generation_server/utils/__init__.py (6:20, 40%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (393:406, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (778:791, 1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (834:848, 1%) - server/text_generation_server/models/__init__.py (1546:1560, <1%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (294:308, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (194:208, 3%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (239:254, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (325:341, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (11:28, 2%) - server/text_generation_server/layers/rotary.py (17:34, 2%) 14 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (84:100, 3%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (100:116, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (305:317, 5%) - server/text_generation_server/server.py (313:325, 5%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fused_moe.py (54:67, 13%) - server/text_generation_server/layers/moe/fused_moe_ipex.py (31:43, 31%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (291:303, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (197:209, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (171:186, 5%) - server/text_generation_server/server.py (191:206, 5%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (186:200, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (221:235, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (272:284, 3%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (453:465, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (164:177, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (197:211, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (73:90, 1%) - server/text_generation_server/models/__init__.py (119:136, <1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (615:628, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (641:654, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (547:559, 1%) - server/text_generation_server/models/__init__.py (761:773, <1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (284:296, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (227:239, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/loader.py (149:169, 12%) - server/text_generation_server/layers/compressed_tensors/loader.py (176:196, 10%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (210:222, 4%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (264:276, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (567:583, 2%) - server/text_generation_server/models/custom_modeling/llava_next.py (260:276, 6%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (432:445, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (279:291, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (260:272, 3%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (228:240, 4%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (155:167, 6%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (136:148, 9%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (319:333, 4%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (393:407, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (39:53, 3%) - server/text_generation_server/layers/gptq/__init__.py (48:62, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (246:258, 3%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (453:465, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (394:406, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fused_moe.py (83:95, 13%) - server/text_generation_server/layers/moe/fused_moe_ipex.py (53:65, 31%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (186:200, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (172:185, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (222:234, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (335:347, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (542:554, 1%) - server/text_generation_server/models/vlm_causal_lm.py (537:549, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (372:387, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (308:323, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (228:243, 3%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (235:250, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (365:378, 2%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (453:465, 1%) 13 duplicated lines in: - backends/neuron/server/text_generation_server/interceptor.py (11:23, 68%) - server/text_generation_server/interceptor.py (15:27, 52%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (246:258, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (272:284, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (103:118, 3%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (100:115, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (272:284, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (824:840, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (260:276, 6%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (752:764, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (246:258, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (225:239, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (197:211, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (432:445, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (394:406, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (394:406, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (394:406, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (453:465, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (372:387, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (308:323, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:171, 4%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (227:239, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (432:445, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (779:791, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (365:378, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (349:361, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (173:185, 4%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (453:465, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (211:226, 2%) - server/text_generation_server/layers/fp8.py (127:142, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (691:704, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (632:645, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (173:185, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (253:270, 2%) - server/text_generation_server/layers/rotary.py (251:268, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (432:445, 2%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (453:465, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (365:378, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (279:291, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (69:85, 2%) - server/text_generation_server/models/custom_modeling/neox_modeling.py (54:70, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (298:310, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (31:43, 6%) - server/text_generation_server/layers/moe/gptq_marlin.py (61:73, 4%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/quantization.py (150:167, 10%) - server/text_generation_server/utils/quantization.py (204:221, 7%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (298:310, 3%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (453:465, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (502:516, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (393:407, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (365:378, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (779:791, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (260:276, 6%) - server/text_generation_server/models/custom_modeling/idefics2.py (809:825, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (335:347, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (294:306, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (173:185, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (249:263, 4%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (264:278, 4%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (365:378, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (394:406, 1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (217:231, 6%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (159:173, 9%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (62:74, 6%) - server/text_generation_server/layers/moe/gptq_marlin.py (61:73, 4%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (95:107, 5%) - server/text_generation_server/server.py (153:165, 5%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (95:107, 5%) - server/text_generation_server/server.py (118:130, 5%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (752:764, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (298:310, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (377:390, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (432:445, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (349:361, 3%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (734:747, 1%) - server/text_generation_server/models/__init__.py (1259:1272, <1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1461:1477, <1%) - server/text_generation_server/models/flash_causal_lm.py (1294:1310, <1%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (260:276, 6%) - server/text_generation_server/models/custom_modeling/idefics3.py (551:567, 2%) 13 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (335:347, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (294:306, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (222:234, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:268, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (166:178, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (196:208, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (172:185, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (220:233, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (167:178, 3%) - server/text_generation_server/layers/marlin/gptq.py (116:127, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:218, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (193:205, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (239:251, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (193:205, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (292:303, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (228:239, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (222:234, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:161, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (150:162, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (179:191, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (245:257, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (137:149, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (172:185, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:217, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (341:352, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (228:239, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (584:599, 1%) - server/text_generation_server/models/vlm_causal_lm.py (637:652, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (223:234, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (198:209, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (822:838, 1%) - server/text_generation_server/models/causal_lm.py (781:796, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (222:234, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (382:394, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (371:384, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (245:257, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (193:205, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/watermark.py (22:36, 18%) - server/text_generation_server/utils/watermark.py (22:36, 18%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (285:296, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (198:209, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (192:204, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (118:130, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (614:625, 1%) - server/text_generation_server/models/__init__.py (954:965, <1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (177:189, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (183:195, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (296:308, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (292:303, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (266:277, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (241:253, 5%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (178:190, 8%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (67:79, 5%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (178:190, 8%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (658:670, 1%) - server/text_generation_server/models/causal_lm.py (646:658, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (202:215, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (220:233, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (199:210, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (336:347, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (222:234, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (118:130, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (238:250, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (242:254, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (199:210, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (353:364, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (199:210, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (304:315, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (373:385, 2%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (822:834, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:159, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (174:186, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (130:143, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (110:123, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (520:538, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (549:567, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (819:831, 1%) - server/text_generation_server/models/__init__.py (1515:1527, <1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (241:253, 5%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (61:73, 8%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (132:145, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (110:123, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (227:240, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (224:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (245:257, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (243:255, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:159, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:268, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:220, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:161, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (183:195, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (193:205, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (469:480, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (569:580, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (192:204, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (395:407, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (418:430, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (71:96, 4%) - server/text_generation_server/utils/weights.py (65:90, 4%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (380:392, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:326, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:234, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:268, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (192:204, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:161, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (222:234, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (174:186, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:234, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:161, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (259:270, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (198:209, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (365:376, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (346:359, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:159, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (85:98, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (110:123, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (227:240, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:161, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (199:210, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (266:277, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (289:300, 2%) - server/text_generation_server/layers/rotary.py (296:307, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (341:352, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (206:217, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (596:614, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (558:576, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (311:323, 1%) - server/text_generation_server/models/vlm_causal_lm.py (302:314, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (218:233, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (202:217, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (223:234, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (266:277, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:218, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (137:149, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (340:353, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (394:406, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (382:394, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (340:353, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:220, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (224:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:220, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (118:130, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (365:377, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:326, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (223:234, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (353:364, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (223:234, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (304:315, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (208:220, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (242:254, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (223:234, 3%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (206:217, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (183:195, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (243:255, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (342:353, 4%) - server/text_generation_server/utils/weights.py (219:230, 4%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (311:323, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (350:362, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (192:204, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:326, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (199:210, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (228:239, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (296:308, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:161, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (332:345, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (377:388, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (226:237, 4%) - server/text_generation_server/utils/weights.py (332:343, 4%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (166:178, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (224:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (54:67, 2%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (98:111, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:159, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (304:316, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (172:185, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (176:189, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (666:678, 1%) - server/text_generation_server/models/__init__.py (1073:1085, <1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:220, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (196:208, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (644:659, 1%) - server/text_generation_server/models/vlm_causal_lm.py (575:590, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (340:358, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (345:363, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:220, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (822:838, 1%) - server/text_generation_server/models/mamba.py (731:745, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (238:250, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (219:231, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/lora.py (85:97, 6%) - server/text_generation_server/layers/lora.py (91:103, 6%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (192:204, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (187:199, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (247:259, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (798:810, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (398:410, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (113:126, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (129:142, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (211:223, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:326, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (113:126, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (85:98, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (259:270, 3%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (206:217, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (227:240, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (304:316, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:105, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (174:186, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:105, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:268, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (296:308, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:268, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (427:439, 2%) - server/text_generation_server/layers/fp8.py (304:316, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:105, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (200:215, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (230:245, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (222:234, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (227:240, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (196:208, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (296:308, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (174:186, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (846:858, 1%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (841:853, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (109:121, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (242:254, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (424:438, 3%) - server/text_generation_server/layers/marlin/gptq.py (235:249, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:234, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (304:316, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (183:195, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (137:149, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (341:352, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (304:315, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/vlm.py (1:17, 25%) - server/text_generation_server/models/custom_modeling/vlm.py (1:17, 25%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (239:251, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (243:255, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (72:86, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (220:233, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (160:171, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (353:364, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (341:352, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (266:277, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (160:171, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (304:315, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (285:296, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (353:364, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (285:296, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (304:315, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:105, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (160:171, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (198:209, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (292:303, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (206:217, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (239:251, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (137:149, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (211:222, 3%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (325:336, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:159, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (224:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (217:229, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (247:259, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (566:577, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (508:519, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (376:388, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (387:399, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (315:327, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:326, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:234, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (224:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (227:240, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:268, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (680:692, 1%) - server/text_generation_server/models/__init__.py (1108:1120, <1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:105, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:161, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:234, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (196:208, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (160:171, 3%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (206:217, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (488:500, 3%) - server/text_generation_server/utils/logits_process.py (493:505, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (238:250, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (191:203, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:220, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (304:316, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (346:364, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (385:403, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (319:332, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (394:406, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (187:199, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (247:259, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (292:303, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (336:347, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:159, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (196:208, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (113:126, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (127:140, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (88:100, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (247:259, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (341:352, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (336:347, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (259:270, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (304:315, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (259:270, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (353:364, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (296:308, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (534:548, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (545:559, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (217:229, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (247:259, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (98:109, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (112:123, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (340:353, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (239:251, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:159, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (118:130, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (311:323, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (374:386, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (192:204, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (174:186, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:220, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (174:186, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (319:332, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (239:251, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (199:210, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (198:209, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:105, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (118:130, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (166:178, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:268, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (296:308, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (118:130, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (259:270, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (228:239, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:220, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (311:323, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (268:280, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (321:332, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (229:240, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:159, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (223:236, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (292:303, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (353:364, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (166:178, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (304:316, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (192:204, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:268, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (822:838, 1%) - server/text_generation_server/models/idefics_causal_lm.py (809:824, 1%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/attention/kv_cache.py (190:205, 9%) - server/text_generation_server/layers/attention/kv_cache.py (310:325, 4%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:218, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (243:255, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (166:178, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:161, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (88:100, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (247:259, 2%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (285:296, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (206:217, 3%) 12 duplicated lines in: - backends/gaudi/server/text_generation_server/models/model.py (84:98, 12%) - server/text_generation_server/models/model.py (118:132, 9%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (157:167, 5%) - server/text_generation_server/layers/fp8.py (322:332, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (160:170, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (163:173, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (334:344, 3%) - server/text_generation_server/adapters/lora.py (377:387, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (462:474, 2%) - server/text_generation_server/layers/fp8.py (225:237, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (515:527, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (423:435, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (514:525, 2%) - server/text_generation_server/models/vlm_causal_lm.py (991:1002, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (212:223, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (419:430, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (163:176, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (242:252, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (193:204, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (388:399, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (381:392, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (388:399, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (973:984, 1%) - server/text_generation_server/models/mllama_causal_lm.py (247:258, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (312:323, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (419:430, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (462:474, 2%) - server/text_generation_server/layers/fp8.py (384:396, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (722:732, 1%) - server/text_generation_server/models/__init__.py (1225:1235, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (396:407, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (351:362, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (76:88, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (189:200, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (920:931, 1%) - server/text_generation_server/models/__init__.py (1672:1683, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (112:122, 2%) - server/text_generation_server/models/custom_modeling/idefics3.py (134:144, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (15:29, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (32:47, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1607:1619, <1%) - server/text_generation_server/models/flash_causal_lm.py (1523:1535, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (112:122, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (135:145, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (377:388, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (351:362, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (530:540, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (519:529, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (309:321, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (512:524, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (124:139, 10%) - server/text_generation_server/layers/moe/unquantized.py (119:134, 5%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (407:420, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (507:520, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (390:400, 2%) - server/text_generation_server/layers/fp8.py (322:332, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (360:370, 3%) - server/text_generation_server/adapters/lora.py (352:362, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (329:342, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:203, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (573:583, 1%) - server/text_generation_server/models/__init__.py (849:859, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (404:415, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (751:762, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (366:377, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (419:430, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (163:176, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (213:223, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (238:248, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:179, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (160:170, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (163:173, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (457:469, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (376:388, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (252:265, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:203, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:104, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (199:211, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:215, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:141, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (375:386, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (392:403, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (212:223, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (388:399, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:139, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:189, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (396:407, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (375:386, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (502:515, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (450:463, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (613:625, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (638:650, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (54:64, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (60:70, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (89:100, 5%) - server/text_generation_server/layers/compressed_tensors/w8a8_int.py (86:97, 5%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (193:204, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (419:430, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (485:497, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (263:274, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (503:515, 2%) - server/text_generation_server/utils/logits_process.py (509:521, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/interceptor.py (16:26, 44%) - server/text_generation_server/interceptor.py (15:25, 44%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (845:856, 1%) - server/text_generation_server/layers/gptq/quantize.py (813:824, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (55:65, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (51:61, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (596:606, 1%) - server/text_generation_server/models/idefics_causal_lm.py (659:669, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (220:231, 3%) - server/text_generation_server/layers/marlin/gptq.py (154:165, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (542:553, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (493:504, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (735:746, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (392:403, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (377:388, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (315:326, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (309:321, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (521:533, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (285:297, 2%) - server/text_generation_server/layers/fp8.py (343:355, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (297:309, 2%) - server/text_generation_server/models/custom_modeling/siglip.py (356:367, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (188:200, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (224:235, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (188:200, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (227:240, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (356:367, 3%) - server/text_generation_server/models/custom_modeling/idefics3.py (297:309, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (34:48, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (33:47, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (794:804, 1%) - server/text_generation_server/models/__init__.py (1405:1415, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (359:371, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (521:533, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (445:455, 3%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (447:457, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (248:260, 3%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (252:264, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (539:549, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (561:571, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1526:1536, <1%) - server/text_generation_server/models/flash_causal_lm.py (1347:1357, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (188:200, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (338:351, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1032:1043, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (180:191, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (782:792, 1%) - server/text_generation_server/models/__init__.py (1371:1381, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (312:323, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (388:399, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (539:549, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (438:448, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (561:573, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (344:356, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (34:48, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (32:47, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:185, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:141, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (259:272, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:203, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (469:481, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (376:388, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1978:1989, <1%) - server/text_generation_server/models/vlm_causal_lm.py (991:1002, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (169:180, 3%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (118:129, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (34:48, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (13:27, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (404:415, 3%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:392, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (379:391, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (489:501, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (381:392, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (419:430, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (359:371, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (512:524, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:139, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:217, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (485:497, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (368:380, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (654:664, 1%) - server/text_generation_server/models/__init__.py (995:1005, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (202:215, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:203, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (654:664, 1%) - server/text_generation_server/models/__init__.py (1046:1056, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (321:332, 3%) - server/text_generation_server/layers/gptq/__init__.py (238:249, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (973:984, 1%) - server/text_generation_server/models/flash_causal_lm.py (1770:1781, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (135:145, 1%) - server/text_generation_server/models/custom_modeling/clip.py (112:122, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (222:235, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:203, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (432:444, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (546:558, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1032:1043, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (184:195, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (241:255, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (237:251, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (188:200, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:160, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (947:957, <1%) - server/text_generation_server/models/flash_causal_lm.py (675:685, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (400:412, 2%) - server/text_generation_server/layers/fp8.py (343:355, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (400:412, 2%) - server/text_generation_server/layers/fp8.py (384:396, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (400:412, 2%) - server/text_generation_server/layers/fp8.py (225:237, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (316:327, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (388:399, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (208:218, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:179, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (889:901, 1%) - server/text_generation_server/models/__init__.py (1610:1622, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (561:571, 1%) - server/text_generation_server/models/__init__.py (813:823, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/hpu.py (34:44, 6%) - server/text_generation_server/layers/gptq/triton.py (248:258, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (35:49, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (32:47, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (813:824, 1%) - server/text_generation_server/layers/gptq/quantize.py (845:856, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (377:388, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (375:386, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (390:400, 2%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (138:148, 7%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:158, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (199:211, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (396:407, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (269:280, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (316:326, 1%) - server/text_generation_server/models/__init__.py (370:380, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (561:573, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (263:274, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (188:200, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:267, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (188:200, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (304:315, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (15:29, 3%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (33:47, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (109:119, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:179, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (396:407, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (315:326, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (524:536, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (546:558, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (123:136, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:203, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (173:183, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (163:173, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (298:310, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (356:367, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (366:377, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (388:399, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (253:266, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:203, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (316:327, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (419:430, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (169:180, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (108:119, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:457, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (519:529, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:139, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:233, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (806:816, 1%) - server/text_generation_server/models/__init__.py (1441:1451, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (95:110, 10%) - server/text_generation_server/layers/moe/unquantized.py (148:163, 5%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (188:200, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (196:207, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (508:520, 2%) - server/text_generation_server/layers/fp8.py (343:355, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (296:307, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (199:211, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (530:540, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (438:448, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (134:144, 2%) - server/text_generation_server/models/custom_modeling/clip.py (112:122, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (735:746, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:392, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (539:552, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (417:430, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (197:210, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:203, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (485:497, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (344:356, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (188:200, 3%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (204:217, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (627:637, 1%) - server/text_generation_server/models/__init__.py (995:1005, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (356:367, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (298:310, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (76:88, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (217:228, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (627:637, 1%) - server/text_generation_server/models/__init__.py (1046:1056, <1%) 11 duplicated lines in: - backends/neuron/server/text_generation_server/cli.py (84:99, 17%) - server/text_generation_server/cli.py (144:155, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (432:444, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (504:516, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (457:469, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (455:467, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (281:294, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (564:577, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (379:391, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (455:467, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:457, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (561:571, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (34:47, 3%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (33:46, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (515:527, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (504:516, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (524:536, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (423:435, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (466:477, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (502:513, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (735:745, 1%) - server/text_generation_server/models/custom_modeling/neox_modeling.py (557:567, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (770:780, 1%) - server/text_generation_server/models/__init__.py (1337:1347, <1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (392:405, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (564:577, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (469:481, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (489:501, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (134:146, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (45:57, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (173:183, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (163:173, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:185, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:141, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (377:388, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (269:280, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (561:573, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (368:380, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (375:386, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (751:762, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (222:233, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (199:211, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (192:203, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (199:211, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (188:200, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (256:269, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (35:49, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (13:27, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:86, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:141, 3%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (539:552, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (335:348, 2%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:219, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (199:211, 1%) 11 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (602:612, 1%) - server/text_generation_server/models/__init__.py (931:941, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (78:88, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (247:256, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (172:182, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:206, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (294:303, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (143:152, 3%) - server/text_generation_server/cli.py (73:82, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (338:347, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (156:165, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (283:292, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (268:277, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (247:257, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (244:254, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (340:350, 1%) - server/text_generation_server/layers/fp8.py (345:355, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (690:699, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (490:499, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (340:350, 1%) - server/text_generation_server/layers/fp8.py (386:396, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (306:315, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (355:364, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (690:699, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (1477:1486, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (202:212, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (91:101, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (416:427, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (387:397, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (287:296, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (328:338, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (228:237, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (230:239, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (128:137, 3%) - server/text_generation_server/models/custom_modeling/clip.py (200:209, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (340:350, 1%) - server/text_generation_server/layers/fp8.py (227:237, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (122:132, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:214, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (520:530, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (546:556, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (41:57, 1%) - server/text_generation_server/models/__init__.py (83:99, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (111:121, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (139:149, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (93:104, 3%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (551:562, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (347:358, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (235:244, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (225:234, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (208:217, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (306:315, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1241:1253, <1%) - server/text_generation_server/models/flash_causal_lm.py (1115:1127, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (355:364, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/hpu.py (157:167, 6%) - server/text_generation_server/layers/gptq/triton.py (325:335, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (25:35, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (25:35, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (201:210, 3%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (210:220, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (139:149, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (268:277, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (274:287, 1%) - server/text_generation_server/layers/rotary.py (282:295, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (210:220, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (245:255, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (172:182, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (91:101, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (188:198, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (523:533, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (338:347, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (294:303, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (448:458, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (636:646, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (317:327, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (244:254, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (230:239, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (208:217, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (718:728, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (461:471, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (690:699, 1%) - server/text_generation_server/models/custom_modeling/neox_modeling.py (508:517, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (690:699, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (393:402, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (230:239, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/layernorm.py (43:55, 23%) - server/text_generation_server/layers/layernorm.py (101:113, 6%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (162:171, 3%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (287:296, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/lora.py (72:82, 5%) - server/text_generation_server/layers/lora.py (78:88, 5%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (355:364, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/lora.py (57:69, 5%) - server/text_generation_server/layers/lora.py (63:75, 5%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (306:315, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (72:82, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (130:140, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (240:250, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (195:205, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (307:317, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (228:237, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (172:182, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (130:140, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (343:352, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/neuron/server/text_generation_server/cli.py (90:99, 15%) - server/text_generation_server/cli.py (73:82, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (162:171, 3%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (448:457, <1%) - server/text_generation_server/models/flash_causal_lm.py (934:943, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (36:47, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (41:52, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (251:260, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (191:200, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (941:955, 1%) - server/text_generation_server/models/__init__.py (1794:1808, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (386:395, 1%) - server/text_generation_server/layers/gptq/quantize.py (418:427, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (287:296, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (210:220, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (195:205, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (36:48, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (35:47, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (448:457, <1%) - server/text_generation_server/models/flash_causal_lm.py (675:684, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (386:395, 1%) - server/text_generation_server/layers/gptq/quantize.py (518:527, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (72:82, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:206, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (240:250, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (245:255, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (578:587, 1%) - server/text_generation_server/models/idefics_causal_lm.py (642:651, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (268:277, 2%) - server/text_generation_server/layers/gptq/__init__.py (413:422, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (200:209, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (294:303, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (338:347, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (317:327, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (139:149, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (202:212, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:206, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (587:596, 2%) - server/text_generation_server/models/custom_modeling/idefics3.py (573:583, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (201:210, 3%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (31:40, 5%) - server/text_generation_server/layers/moe/unquantized.py (19:28, 5%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (343:352, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (287:297, 1%) - server/text_generation_server/layers/fp8.py (277:287, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (185:195, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (244:254, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (194:204, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (130:140, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (261:270, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (93:104, 3%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (173:184, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (188:198, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (514:524, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (464:474, 1%) - server/text_generation_server/layers/fp8.py (277:287, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (343:352, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (568:580, <1%) - server/text_generation_server/models/flash_causal_lm.py (566:578, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (208:217, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (325:334, 2%) - server/text_generation_server/layers/gptq/__init__.py (177:186, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (200:209, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (325:334, 2%) - server/text_generation_server/layers/gptq/__init__.py (413:422, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (690:699, 1%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (787:796, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (338:347, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (230:239, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (251:260, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (219:228, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (268:277, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (200:209, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (275:284, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (157:166, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (172:182, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:206, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (261:270, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (268:277, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (13:22, 9%) - server/text_generation_server/layers/moe/gptq_marlin.py (61:70, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (355:364, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (306:315, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (225:234, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (268:277, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (294:303, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (347:358, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (390:399, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (194:204, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:214, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (225:234, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (240:250, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (139:149, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (415:424, 2%) - server/text_generation_server/layers/gptq/__init__.py (311:320, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (72:82, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (91:101, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (208:217, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (250:260, 3%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (548:559, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (108:118, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (113:122, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/medusa.py (82:91, 7%) - server/text_generation_server/layers/medusa.py (121:130, 7%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (189:198, 5%) - server/text_generation_server/layers/moe/__init__.py (77:86, 4%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (189:198, 5%) - server/text_generation_server/layers/moe/__init__.py (46:55, 4%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1641:1650, <1%) - server/text_generation_server/models/flash_causal_lm.py (1582:1592, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (122:132, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (176:186, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (688:698, <1%) - server/text_generation_server/models/flash_causal_lm.py (693:703, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (230:239, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (343:352, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (225:234, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (62:71, 5%) - server/text_generation_server/layers/moe/fp8.py (21:30, 6%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (537:548, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (254:264, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/medusa.py (121:130, 7%) - server/text_generation_server/layers/medusa.py (82:91, 7%) 10 duplicated lines in: - backends/neuron/server/text_generation_server/cli.py (52:61, 15%) - server/text_generation_server/cli.py (146:155, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (947:956, <1%) - server/text_generation_server/models/flash_causal_lm.py (445:454, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (376:386, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (523:533, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (201:210, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (31:40, 5%) - server/text_generation_server/layers/moe/fp8.py (21:30, 6%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (276:286, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (274:284, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (225:234, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (62:71, 5%) - server/text_generation_server/layers/moe/__init__.py (204:213, 4%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (560:571, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:456, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (230:239, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (439:450, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (582:593, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (35:46, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (35:46, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (241:251, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (244:254, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (402:412, 1%) - server/text_generation_server/layers/fp8.py (277:287, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (29:39, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (29:39, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (189:198, 5%) - server/text_generation_server/layers/moe/gptq_marlin.py (61:70, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (61:70, 4%) - server/text_generation_server/layers/moe/fp8.py (51:60, 6%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (111:121, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (245:255, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (261:270, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1230:1239, <1%) - server/text_generation_server/models/flash_causal_lm.py (1104:1113, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (62:71, 5%) - server/text_generation_server/layers/moe/unquantized.py (19:28, 5%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (122:132, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:206, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (449:458, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (443:452, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (207:217, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (523:533, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (21:30, 4%) - server/text_generation_server/layers/moe/__init__.py (77:86, 4%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (172:182, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (130:140, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (21:30, 4%) - server/text_generation_server/layers/moe/__init__.py (46:55, 4%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (317:327, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (195:205, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (268:277, 2%) - server/text_generation_server/layers/gptq/__init__.py (177:186, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (263:272, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (200:209, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (113:123, 4%) - server/text_generation_server/layers/fp8.py (268:278, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (208:217, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (608:617, 1%) - server/text_generation_server/models/transformers_flash_causal_lm.py (236:245, 4%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (85:97, 1%) - server/text_generation_server/layers/rotary.py (87:99, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (266:277, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (228:237, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (690:699, 1%) - server/text_generation_server/models/custom_modeling/t5_modeling.py (828:837, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (201:210, 3%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (111:121, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (195:205, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (294:303, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (338:347, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (651:660, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (674:683, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (200:209, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (128:137, 3%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (203:212, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (339:349, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (425:436, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (331:341, 1%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (101:111, 6%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (541:550, 1%) - server/text_generation_server/models/transformers_flash_vlm.py (151:160, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (78:88, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (247:256, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (208:217, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (261:270, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (172:182, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (91:101, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (355:364, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (287:296, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (341:352, 1%) - server/text_generation_server/models/__init__.py (411:422, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (306:315, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (201:210, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (29:39, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (25:35, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (150:159, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:138, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (202:212, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (130:140, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (287:296, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (231:240, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (376:386, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (514:524, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (21:30, 4%) - server/text_generation_server/layers/moe/gptq_marlin.py (61:70, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (317:327, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (245:255, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/__init__.py (31:40, 5%) - server/text_generation_server/layers/moe/__init__.py (204:213, 4%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (378:387, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (361:372, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (798:807, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (114:123, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (162:171, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (174:185, 2%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (232:243, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (201:210, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1548:1557, <1%) - server/text_generation_server/models/flash_causal_lm.py (1358:1367, <1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (169:179, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (202:211, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/tokens.py (259:270, 1%) - server/text_generation_server/utils/tokens.py (251:261, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (648:658, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (448:458, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (306:315, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (355:364, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (343:352, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/tensor_parallel.py (92:103, 5%) - server/text_generation_server/layers/tensor_parallel.py (98:109, 5%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (465:477, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (426:438, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (162:171, 3%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (65:74, 3%) - server/text_generation_server/cli.py (146:155, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (25:35, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (29:39, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (200:209, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (623:634, 1%) - server/text_generation_server/models/seq2seq_lm.py (641:652, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (323:332, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (194:204, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (220:230, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (122:132, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (220:230, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (461:471, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (718:728, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (343:352, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (261:270, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (25:35, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (25:35, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (200:209, 2%) - server/text_generation_server/models/custom_modeling/siglip.py (128:137, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (281:290, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (267:276, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (255:265, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (274:284, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (207:217, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (514:524, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (29:39, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (25:35, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (518:527, 1%) - server/text_generation_server/layers/gptq/quantize.py (418:427, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (518:527, 1%) - server/text_generation_server/layers/gptq/quantize.py (386:395, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (134:144, 3%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (173:183, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (510:520, 1%) - server/text_generation_server/layers/fp8.py (277:287, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (122:132, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (91:101, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (162:171, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (208:218, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (244:254, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (294:303, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (327:336, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (172:182, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:148, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (213:222, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (439:450, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (591:602, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (194:204, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (176:186, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (541:550, 1%) - server/text_generation_server/models/causal_lm.py (501:510, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (418:427, 1%) - server/text_generation_server/layers/gptq/quantize.py (518:527, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (636:647, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:456, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (418:427, 1%) - server/text_generation_server/layers/gptq/quantize.py (386:395, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (13:22, 9%) - server/text_generation_server/layers/moe/__init__.py (46:55, 4%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (13:22, 9%) - server/text_generation_server/layers/moe/__init__.py (77:86, 4%) 10 duplicated lines in: - backends/neuron/server/text_generation_server/cli.py (52:61, 15%) - server/text_generation_server/cli.py (73:82, 3%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (384:393, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (333:342, 1%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (225:234, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (302:311, 2%) 10 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (398:410, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (426:438, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (525:533, 1%) - server/text_generation_server/models/flash_causal_lm.py (1731:1739, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (245:253, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (216:225, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (525:533, 1%) - server/text_generation_server/models/vlm_causal_lm.py (960:968, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:176, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (195:203, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (212:221, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (193:201, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (161:170, 6%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (353:362, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (385:394, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (421:430, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (313:324, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (373:384, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (411:420, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (447:456, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (433:442, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (421:430, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:230, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (385:394, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (377:386, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (390:398, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (453:462, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (266:275, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (418:427, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (550:559, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:159, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (401:410, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (356:365, 3%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (433:442, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:140, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (385:394, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (47:56, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (43:52, 3%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (379:388, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (41:52, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (35:46, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (195:204, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:323, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (433:442, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (317:326, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (297:307, 1%) - server/text_generation_server/models/custom_modeling/clip.py (401:410, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (385:394, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (844:852, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (831:840, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (411:420, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (593:602, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (368:377, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:186, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (140:149, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (230:239, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (214:223, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (36:47, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (40:51, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (148:158, 3%) - server/text_generation_server/models/custom_modeling/clip.py (219:229, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:204, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (214:223, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (212:221, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (243:251, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (453:462, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (372:381, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:159, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:101, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (606:616, <1%) - server/text_generation_server/models/flash_causal_lm.py (619:629, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (254:263, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (317:326, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (617:625, 1%) - server/text_generation_server/layers/fp8.py (489:497, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:230, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (174:183, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (105:114, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:204, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:138, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (145:154, 4%) - server/text_generation_server/models/custom_modeling/idefics3.py (462:471, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (212:221, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (137:145, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (356:364, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (312:320, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (398:407, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (219:229, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (148:158, 3%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (72:80, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (90:98, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (668:676, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (206:214, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (294:303, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (250:259, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:214, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (396:405, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (492:501, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (368:377, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:159, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:230, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (269:278, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (230:239, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:132, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (562:570, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (587:596, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:214, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (76:84, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (80:88, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (554:563, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (544:552, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (433:442, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (377:386, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (554:563, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (461:469, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (214:223, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (230:239, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (583:597, <1%) - server/text_generation_server/models/flash_causal_lm.py (582:596, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (639:647, <1%) - server/text_generation_server/models/flash_causal_lm.py (909:917, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (383:392, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1177:1187, <1%) - server/text_generation_server/models/flash_causal_lm.py (1053:1063, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (214:223, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (279:288, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (153:162, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (105:114, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (215:232, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (337:351, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (418:427, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (255:264, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:138, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (379:388, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (247:255, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (169:179, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (539:548, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (388:397, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (30:38, 1%) - server/text_generation_server/layers/rotary.py (36:44, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (684:694, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (80:90, 9%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (401:410, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (298:308, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (269:278, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (280:289, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:230, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (280:289, 4%) - server/text_generation_server/models/custom_modeling/idefics2.py (831:840, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:186, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (340:349, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (255:264, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (562:571, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (511:520, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (343:355, 1%) - server/text_generation_server/models/causal_lm.py (317:329, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:136, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:140, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:214, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (183:191, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (216:225, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:176, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (139:147, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (70:78, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (90:98, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (385:394, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (390:399, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:204, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (318:327, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (382:391, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (339:348, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (506:515, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (584:593, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (70:78, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (90:98, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (245:253, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:323, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (251:260, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (427:436, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (29:37, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (156:164, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1989:1997, <1%) - server/text_generation_server/models/flash_causal_lm.py (1731:1739, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (208:216, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (169:179, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (367:378, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (323:334, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (938:946, <1%) - server/text_generation_server/models/flash_causal_lm.py (664:672, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (149:157, 6%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (80:88, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (460:469, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (339:348, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (431:440, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (270:279, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (279:288, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (398:407, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (433:442, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (390:399, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (711:720, <1%) - server/text_generation_server/models/__init__.py (1674:1683, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:186, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (554:563, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (587:596, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (396:405, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (379:388, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (131:140, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (123:132, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (212:221, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (242:250, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:101, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:132, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:138, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:132, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (307:315, 3%) - server/text_generation_server/cli.py (120:128, 3%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (86:95, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (123:132, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (734:743, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (476:485, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (468:476, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (544:552, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (462:471, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (145:154, 4%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (719:728, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (145:154, 4%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (379:388, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (396:405, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (458:467, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (83:91, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (80:88, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (562:571, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (454:463, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (441:449, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (475:483, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (562:570, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (544:552, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (99:107, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (69:77, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:101, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:214, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (216:225, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (460:469, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (568:577, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (441:450, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (511:520, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:182, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (433:442, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (271:280, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (214:223, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (280:289, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/log.py (5:15, 100%) - server/text_generation_server/utils/log.py (5:15, 100%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:159, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (411:420, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (584:593, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:132, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (238:246, 1%) - server/text_generation_server/layers/rotary.py (134:142, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (385:394, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (271:280, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (472:481, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (421:430, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (135:143, 1%) - server/text_generation_server/layers/rotary.py (236:244, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (214:223, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (105:114, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (385:394, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (317:326, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (472:481, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (568:577, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (383:392, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (468:476, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (587:596, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (241:249, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (169:179, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (119:128, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (84:93, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (506:515, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (593:602, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:159, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:182, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (766:776, 1%) - server/text_generation_server/models/causal_lm.py (725:735, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (318:327, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:140, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (43:52, 3%) - server/text_generation_server/models/custom_modeling/clip.py (47:56, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (86:95, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (123:132, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (298:308, 1%) - server/text_generation_server/models/custom_modeling/clip.py (401:410, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:323, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:136, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/neuron/server/text_generation_server/server.py (71:81, 15%) - server/text_generation_server/server.py (299:309, 3%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (251:260, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (388:397, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1989:1997, <1%) - server/text_generation_server/models/vlm_causal_lm.py (960:968, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:136, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (340:349, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (550:559, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (204:212, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (656:664, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (132:141, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (84:93, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:159, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:214, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (922:931, <1%) - server/text_generation_server/models/__init__.py (1076:1085, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (922:931, <1%) - server/text_generation_server/models/__init__.py (1111:1120, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:182, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (239:247, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (216:225, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:182, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (641:654, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (668:681, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:186, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (368:377, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (177:185, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (167:175, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (195:204, 3%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:206, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (539:548, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (427:436, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (711:720, <1%) - server/text_generation_server/models/__init__.py (1076:1085, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (711:720, <1%) - server/text_generation_server/models/__init__.py (1111:1120, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (270:279, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (280:289, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (359:368, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (162:171, 6%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:182, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:182, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (185:193, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (169:179, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/mlp.py (124:139, 4%) - server/text_generation_server/layers/mlp.py (217:232, 4%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:136, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:206, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (87:96, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (123:132, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (214:223, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:176, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (245:253, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (878:886, <1%) - server/text_generation_server/models/__init__.py (1582:1590, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (190:200, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (225:235, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:132, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:101, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (80:90, 9%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (779:789, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (83:91, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (150:158, 6%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (132:141, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (91:100, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (666:677, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (692:703, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:159, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:140, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (433:442, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (353:362, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (243:254, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (246:257, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (117:125, 3%) - server/text_generation_server/server.py (267:275, 3%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (149:157, 6%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (80:88, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (195:204, 3%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (209:217, 4%) - server/text_generation_server/layers/fp8.py (324:332, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:176, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (326:334, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:204, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (766:776, 1%) - server/text_generation_server/models/mamba.py (675:685, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (683:692, <1%) - server/text_generation_server/models/__init__.py (1674:1683, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (669:678, <1%) - server/text_generation_server/models/__init__.py (1674:1683, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (299:307, 1%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (75:83, 6%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:140, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (922:930, <1%) - server/text_generation_server/models/flash_causal_lm.py (650:658, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (71:79, 2%) - server/text_generation_server/layers/marlin/gptq.py (60:68, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (254:263, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (390:399, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:206, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (86:94, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (67:75, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:214, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (269:278, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (279:288, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:82, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (73:81, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (156:164, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (149:157, 6%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (73:81, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:159, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:206, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (318:327, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:82, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (83:91, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (73:81, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (75:83, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (150:158, 6%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (280:289, 4%) - server/text_generation_server/models/custom_modeling/llava_next.py (282:291, 4%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (669:678, <1%) - server/text_generation_server/models/__init__.py (1111:1120, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:230, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (202:210, 3%) - server/text_generation_server/models/__init__.py (1803:1811, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (178:186, 1%) - server/text_generation_server/models/vlm_causal_lm.py (527:535, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (221:231, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (194:204, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (294:303, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (250:259, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (212:221, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (218:226, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:176, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (220:228, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (81:89, 4%) - server/text_generation_server/layers/fp8.py (239:247, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (87:96, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (123:132, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (86:94, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (69:77, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (382:391, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (568:577, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (99:107, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (67:75, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (76:84, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (150:158, 6%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:206, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (119:128, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (91:100, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:182, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (145:154, 4%) - server/text_generation_server/models/custom_modeling/idefics2.py (719:728, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:136, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (460:469, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (421:430, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (385:394, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (353:362, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (382:391, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (421:430, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:204, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:138, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (356:365, 3%) - server/text_generation_server/models/custom_modeling/clip.py (401:410, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:140, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (264:273, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (140:149, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (279:288, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (568:576, 1%) - server/text_generation_server/layers/rotary.py (564:572, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (683:692, <1%) - server/text_generation_server/models/__init__.py (1076:1085, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (562:570, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (461:469, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (453:462, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (348:357, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1989:1997, <1%) - server/text_generation_server/models/mllama_causal_lm.py (216:224, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (285:294, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (379:388, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (324:335, <1%) - server/text_generation_server/models/flash_causal_lm.py (288:299, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (433:442, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (383:392, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:138, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:176, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (244:252, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (254:263, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (271:280, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (477:486, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (733:742, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (543:552, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (458:467, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (117:125, 3%) - server/text_generation_server/server.py (315:323, 3%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (246:258, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (309:321, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:82, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:199, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:101, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (638:647, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (454:463, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:182, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (307:315, 3%) - server/text_generation_server/server.py (267:275, 3%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (844:852, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (282:291, 4%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:138, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/quantization.py (142:150, 7%) - server/text_generation_server/utils/quantization.py (163:171, 5%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (75:83, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (80:88, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (254:263, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (353:362, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (441:450, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (454:463, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (532:540, 1%) - server/text_generation_server/models/mllama_causal_lm.py (156:164, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (209:217, 4%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (140:148, 6%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (72:80, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (90:98, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (241:250, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:311, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (653:661, <1%) - server/text_generation_server/models/flash_causal_lm.py (925:933, <1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:82, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (468:476, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (461:469, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:161, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:136, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:101, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (285:294, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (492:501, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (366:374, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (359:367, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (254:263, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (377:386, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (137:147, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (144:154, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (254:263, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (421:430, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (112:120, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (70:78, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (254:263, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (441:450, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:159, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:186, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (525:533, 1%) - server/text_generation_server/models/mllama_causal_lm.py (216:224, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (454:462, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (441:449, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (285:294, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (458:467, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (140:149, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (280:289, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (398:407, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (269:278, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/mlp.py (217:232, 4%) - server/text_generation_server/layers/mlp.py (124:139, 4%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (343:355, 1%) - server/text_generation_server/models/mamba.py (332:344, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (317:325, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (169:179, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:67, 3%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:206, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (270:279, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (230:239, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (543:552, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (379:388, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (638:647, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (511:520, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (506:515, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (447:456, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:136, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (254:263, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (392:401, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:195, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (472:481, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (339:348, 2%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (401:410, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (297:307, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (543:552, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (492:501, 1%) 9 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (239:248, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (245:254, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (273:280, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (456:464, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (400:407, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (320:327, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (320:327, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/kernels.py (9:22, 100%) - server/text_generation_server/utils/kernels.py (9:22, 100%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (197:204, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (273:280, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (320:327, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (320:327, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (387:394, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (750:757, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (651:658, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (378:386, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:455, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (334:341, 2%) - server/text_generation_server/adapters/lora.py (364:371, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (334:341, 2%) - server/text_generation_server/adapters/lora.py (389:396, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (836:843, <1%) - server/text_generation_server/models/__init__.py (1517:1524, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (83:93, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (120:130, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (412:419, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (134:141, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (113:121, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:637, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (256:263, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (255:262, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (477:485, <1%) - server/text_generation_server/models/causal_lm.py (80:88, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:637, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (381:388, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (416:423, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (440:447, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (394:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (276:284, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (91:99, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/attention/hpu.py (73:80, 4%) - server/text_generation_server/layers/attention/cuda.py (228:235, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (379:386, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (327:336, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (473:482, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (394:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:637, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:637, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (443:450, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (390:397, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (660:667, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (316:323, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (416:423, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (581:588, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (381:390, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (369:378, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (986:993, <1%) - server/text_generation_server/models/vlm_causal_lm.py (961:968, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (821:828, <1%) - server/text_generation_server/models/__init__.py (1548:1555, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (205:212, 2%) - server/text_generation_server/models/custom_modeling/idefics3.py (277:285, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/attention/hpu.py (73:80, 4%) - server/text_generation_server/layers/attention/rocm.py (273:280, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (419:426, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (409:416, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (387:394, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (379:386, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (216:223, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2060:2067, <1%) - server/text_generation_server/models/flash_causal_lm.py (1998:2005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (922:930, <1%) - server/text_generation_server/models/__init__.py (1262:1270, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (82:90, 1%) - server/text_generation_server/models/flash_causal_lm.py (470:478, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (515:523, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (637:645, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (385:392, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (393:402, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (392:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (379:386, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (267:275, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (283:291, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:455, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (165:173, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (190:198, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/medusa.py (84:91, 6%) - server/text_generation_server/layers/mlp.py (265:272, 3%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (332:340, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (646:654, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (216:223, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (316:323, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (496:503, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (409:416, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (456:464, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (384:392, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (86:93, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (71:78, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (515:523, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (384:392, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (392:399, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (113:120, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (111:118, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (197:204, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (530:537, <1%) - server/text_generation_server/models/__init__.py (670:677, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (986:993, <1%) - server/text_generation_server/models/mllama_causal_lm.py (217:224, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (515:523, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (646:654, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (407:415, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (515:522, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (409:416, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (602:609, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (472:479, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (447:456, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (457:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (680:688, 1%) - server/text_generation_server/models/custom_modeling/bloom_modeling.py (880:888, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (74:81, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (130:137, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (443:450, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (381:388, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (379:386, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (447:456, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:340, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (385:392, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (447:456, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (369:378, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (697:704, <1%) - server/text_generation_server/models/__init__.py (1674:1682, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (416:423, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (572:579, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (620:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:455, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (701:709, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (817:825, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (595:602, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (497:504, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (696:704, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (337:345, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (226:233, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (697:704, <1%) - server/text_generation_server/models/__init__.py (1262:1270, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (620:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (353:362, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (457:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (637:647, 1%) - server/text_generation_server/models/custom_modeling/neox_modeling.py (85:95, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (276:284, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (130:138, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (381:388, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (360:367, 2%) - server/text_generation_server/adapters/lora.py (364:371, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (435:442, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (173:183, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (241:251, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (360:367, 2%) - server/text_generation_server/adapters/lora.py (389:396, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (439:448, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (369:378, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (133:140, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (71:78, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (353:362, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (473:482, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (966:973, <1%) - server/text_generation_server/server.py (269:276, 3%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (67:74, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (63:70, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (419:426, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (497:504, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (701:709, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (268:276, 4%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (285:293, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (288:296, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (412:421, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (369:378, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (271:278, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (385:392, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (394:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (332:341, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (392:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (400:407, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (256:263, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (180:190, 1%) - server/text_generation_server/models/idefics_causal_lm.py (233:243, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (319:326, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (620:628, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (576:584, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (105:113, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (131:138, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (372:379, 2%) - server/text_generation_server/adapters/lora.py (352:359, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (372:379, 2%) - server/text_generation_server/adapters/lora.py (377:384, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (372:379, 2%) - server/text_generation_server/adapters/lora.py (364:371, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (696:704, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (384:392, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (595:602, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (409:416, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (632:639, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (533:540, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (256:263, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (279:291, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (296:308, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (387:394, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (128:135, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (152:159, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (456:464, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (646:654, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (307:315, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (428:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (750:757, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (398:405, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1369:1376, <1%) - server/text_generation_server/models/seq2seq_lm.py (543:550, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:664, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:664, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (643:650, <1%) - server/text_generation_server/models/__init__.py (1076:1084, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (237:244, 3%) - server/text_generation_server/server.py (256:263, 3%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (643:650, <1%) - server/text_generation_server/models/__init__.py (1111:1119, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (332:340, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (637:645, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (716:723, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (198:206, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (456:464, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (395:403, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (392:399, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (436:443, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (412:421, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:340, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (492:499, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (533:540, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (379:386, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (256:263, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (515:523, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:455, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (646:654, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/medusa.py (123:130, 6%) - server/text_generation_server/layers/mlp.py (265:272, 3%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (492:499, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (660:667, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (319:326, 2%) - server/text_generation_server/utils/weights.py (312:319, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (228:235, 1%) - server/text_generation_server/models/mamba.py (239:246, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (435:442, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (316:323, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:377, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (86:93, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (157:164, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (327:336, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (402:411, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:377, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (355:362, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (381:390, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (473:482, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:664, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:664, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (172:180, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (284:292, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (197:204, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (477:485, <1%) - server/text_generation_server/models/mamba.py (120:128, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:664, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:664, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:664, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (935:942, <1%) - server/text_generation_server/models/__init__.py (1702:1709, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (83:90, 7%) - server/text_generation_server/layers/moe/fp8.py (143:150, 5%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (620:628, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (754:762, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:664, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (327:336, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (369:378, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (271:278, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (443:450, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:664, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (136:144, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (162:170, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (332:341, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:340, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (197:204, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (316:323, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (152:159, 1%) - server/text_generation_server/models/custom_modeling/clip.py (128:135, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (456:464, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (754:762, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (381:388, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (906:913, <1%) - server/text_generation_server/models/__init__.py (1111:1119, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (906:913, <1%) - server/text_generation_server/models/__init__.py (1076:1084, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (393:402, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:340, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (256:263, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (407:418, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (420:431, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (298:307, <1%) - server/text_generation_server/models/vlm_causal_lm.py (289:298, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (353:362, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (402:411, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (94:105, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (38:49, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (327:335, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (471:480, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (423:430, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (385:392, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (394:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (426:437, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (453:464, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (492:499, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (768:775, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (541:549, 1%) - server/text_generation_server/models/mllama_causal_lm.py (306:314, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (439:448, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:340, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (9:20, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (9:20, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (906:913, <1%) - server/text_generation_server/models/__init__.py (1674:1682, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (114:121, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (157:164, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2344:2351, <1%) - server/text_generation_server/models/flash_causal_lm.py (1935:1942, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/attention/hpu.py (73:80, 4%) - server/text_generation_server/layers/attention/ipex.py (17:24, 5%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (620:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (384:392, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (385:392, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (435:442, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (400:407, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (74:81, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (86:93, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (390:397, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (533:540, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (737:745, <1%) - server/text_generation_server/models/__init__.py (1076:1084, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (737:745, <1%) - server/text_generation_server/models/__init__.py (1111:1119, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (372:379, <1%) - server/text_generation_server/layers/gptq/quantize.py (546:553, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (197:204, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (583:592, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (535:544, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (620:628, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (395:403, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (379:386, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (439:448, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (402:411, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:860, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (131:138, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (157:164, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (320:327, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (439:448, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (457:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (711:719, <1%) - server/text_generation_server/models/__init__.py (1262:1270, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (202:210, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (284:292, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (435:442, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (319:326, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (394:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (933:941, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (962:969, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (276:284, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:204, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (906:913, <1%) - server/text_generation_server/models/__init__.py (1262:1270, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (750:757, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (768:775, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (353:362, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (392:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (400:407, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (327:336, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (405:414, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (435:442, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (647:654, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (650:657, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (492:499, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (651:658, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (387:394, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (128:135, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (151:158, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (122:132, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (80:90, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (435:442, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (206:213, 2%) - server/text_generation_server/layers/gptq/__init__.py (177:184, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (161:169, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (82:90, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (276:284, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:212, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (372:379, <1%) - server/text_generation_server/layers/gptq/quantize.py (404:411, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (327:336, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (437:446, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (372:379, <1%) - server/text_generation_server/layers/gptq/quantize.py (448:455, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (268:276, 4%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (796:804, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (372:379, <1%) - server/text_generation_server/layers/gptq/quantize.py (504:511, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (273:280, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (390:397, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (651:658, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (632:639, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (398:405, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (20:27, <1%) - server/text_generation_server/models/flash_causal_lm.py (22:29, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (141:151, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (80:90, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (216:223, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (190:199, 1%) - server/text_generation_server/layers/fp8.py (109:118, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (737:745, <1%) - server/text_generation_server/models/__init__.py (1674:1682, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (264:272, 1%) - server/text_generation_server/layers/fp8.py (365:373, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (206:213, 2%) - server/text_generation_server/layers/gptq/__init__.py (413:420, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (332:341, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (457:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (456:464, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (637:645, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (455:462, 1%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (141:148, 5%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:74, 8%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (766:773, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (271:278, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (696:704, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (754:762, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (74:81, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (128:135, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (277:285, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (205:212, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (629:637, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (655:663, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (918:927, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (92:101, 8%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (541:548, 1%) - server/text_generation_server/models/flash_causal_lm.py (1194:1201, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (319:326, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (750:757, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (660:667, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (507:516, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (535:544, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/lora.py (100:108, 4%) - server/text_generation_server/layers/lora.py (106:114, 4%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (216:223, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (273:280, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (216:223, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (637:645, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (378:386, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (646:654, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (696:704, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:455, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (478:486, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (164:172, 4%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (392:399, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:377, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (256:263, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (407:415, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:455, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (320:327, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:377, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (216:223, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (701:709, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (559:567, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (477:485, <1%) - server/text_generation_server/models/seq2seq_lm.py (84:92, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (412:421, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (392:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (256:263, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (327:336, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:340, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (423:430, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (439:448, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (392:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/conv.py (9:17, 25%) - server/text_generation_server/layers/conv.py (27:35, 25%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (197:204, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (359:367, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (413:421, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (412:421, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (405:414, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (395:403, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (496:504, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (301:309, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (407:415, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (646:654, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (412:421, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (402:411, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (82:90, 1%) - server/text_generation_server/models/mamba.py (120:128, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (184:191, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (188:195, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (415:422, 2%) - server/text_generation_server/layers/gptq/__init__.py (242:249, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:780, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (381:388, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (422:429, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (428:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (180:190, 1%) - server/text_generation_server/models/mamba.py (200:210, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (708:715, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (398:405, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:637, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (318:325, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (283:290, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (392:399, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:637, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (30:37, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (130:137, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (353:362, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (437:446, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (379:386, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:637, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (486:493, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (440:447, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (83:93, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (138:148, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (435:442, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:637, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:637, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (400:407, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (575:583, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (796:804, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (880:888, 1%) - server/text_generation_server/models/custom_modeling/bloom_modeling.py (680:688, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (192:199, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (188:195, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (271:278, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (393:402, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (457:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:377, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (273:280, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (180:188, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (186:194, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/linear.py (18:25, 30%) - server/text_generation_server/layers/linear.py (68:75, 8%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (435:442, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (285:293, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (316:323, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (381:388, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (87:95, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (353:361, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (416:423, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (323:330, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (394:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (392:399, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (738:746, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (646:654, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (184:191, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (180:187, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (443:450, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (327:336, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (392:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (332:340, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (754:762, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1507:1514, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (300:307, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (832:840, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (796:804, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (447:456, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (437:446, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (390:397, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (398:405, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (355:362, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (660:668, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (681:689, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:377, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (276:284, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (220:228, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (316:323, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:377, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (113:120, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (128:135, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (113:120, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (86:93, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (439:448, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (405:414, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (87:95, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (162:170, 6%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (319:326, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (503:511, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (413:421, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (353:362, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:340, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (332:341, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (405:414, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1369:1376, <1%) - server/text_generation_server/models/causal_lm.py (501:508, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (379:386, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (62:69, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (180:187, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/conv.py (27:35, 25%) - server/text_generation_server/layers/conv.py (9:17, 25%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (447:456, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (402:411, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (257:264, 3%) - server/text_generation_server/server.py (265:272, 3%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (62:74, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (22:34, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (515:523, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (395:403, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (133:140, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (157:164, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (273:280, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (447:456, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (473:482, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (697:704, <1%) - server/text_generation_server/models/__init__.py (1111:1119, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (496:503, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (497:504, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (697:704, <1%) - server/text_generation_server/models/__init__.py (1076:1084, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (327:336, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (457:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (683:691, <1%) - server/text_generation_server/models/__init__.py (1262:1270, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (447:456, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (392:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (359:367, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (82:90, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (271:278, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (545:552, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (567:575, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (515:523, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (513:520, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (962:969, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (447:456, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (405:414, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (242:250, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (708:715, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (660:667, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (298:305, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (309:316, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (449:456, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (623:630, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (332:340, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:455, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (205:212, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (278:286, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (510:517, <1%) - server/text_generation_server/models/__init__.py (704:711, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (669:677, <1%) - server/text_generation_server/models/__init__.py (1262:1270, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (273:280, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (88:97, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (101:110, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (355:362, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (393:402, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (402:411, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (632:639, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (651:658, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (151:158, 1%) - server/text_generation_server/models/custom_modeling/clip.py (128:135, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (30:37, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (86:93, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (632:639, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (660:667, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (381:390, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:340, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (146:154, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (162:170, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (632:639, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (768:775, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (332:341, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (402:411, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (407:415, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (637:645, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (147:156, 1%) - server/text_generation_server/models/causal_lm.py (147:156, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (57:64, 8%) - server/text_generation_server/models/custom_modeling/llava_next.py (140:147, 4%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (356:364, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (515:522, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (497:504, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (332:341, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (369:378, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (82:90, 1%) - server/text_generation_server/models/idefics_causal_lm.py (87:95, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (393:402, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (437:446, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (443:450, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (423:430, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (147:156, 1%) - server/text_generation_server/models/mamba.py (176:183, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (256:263, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (708:715, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (533:540, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (231:241, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (235:245, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (378:386, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (498:507, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (92:101, 8%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (354:361, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (355:362, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (269:276, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (330:337, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (423:430, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:804, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:872, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (332:341, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (437:446, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (79:87, 3%) - server/text_generation_server/layers/compressed_tensors/w8a8_int.py (76:84, 4%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (378:386, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (311:319, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (24:37, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (56:68, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (423:430, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (392:399, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (332:341, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (473:482, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (271:278, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/attention/kv_cache.py (153:160, 6%) - server/text_generation_server/layers/attention/kv_cache.py (171:178, 3%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (583:591, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (413:421, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (58:65, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (56:63, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (355:362, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (105:113, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (45:52, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (504:511, <1%) - server/text_generation_server/layers/gptq/quantize.py (448:455, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (85:93, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (162:170, 6%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (617:624, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (504:511, <1%) - server/text_generation_server/layers/gptq/quantize.py (404:411, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (443:450, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (416:423, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (325:332, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (412:421, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (437:446, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:612, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (393:402, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (405:414, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (227:236, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (287:296, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (266:274, 3%) - server/text_generation_server/server.py (274:282, 3%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (504:511, <1%) - server/text_generation_server/layers/gptq/quantize.py (372:379, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (164:172, 4%) - server/text_generation_server/models/custom_modeling/idefics2.py (734:742, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (738:746, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (637:645, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (278:286, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (205:212, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (319:326, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (316:323, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (131:138, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (71:78, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:816, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (504:511, <1%) - server/text_generation_server/layers/gptq/quantize.py (546:553, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (392:399, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (387:394, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (456:463, <1%) - server/text_generation_server/utils/hub.py (36:43, 4%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (958:965, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (385:392, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (423:430, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (387:394, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (355:362, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (492:499, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (398:405, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (666:673, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:732, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (387:394, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/mlp.py (265:272, 3%) - server/text_generation_server/layers/medusa.py (123:130, 6%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/mlp.py (265:272, 3%) - server/text_generation_server/layers/medusa.py (84:91, 6%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (423:430, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (82:90, 1%) - server/text_generation_server/models/causal_lm.py (80:88, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (332:340, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (395:403, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (986:993, <1%) - server/text_generation_server/models/flash_causal_lm.py (1732:1739, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (393:402, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (369:378, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (167:175, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (159:167, 5%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (852:859, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (404:411, <1%) - server/text_generation_server/layers/gptq/quantize.py (372:379, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (412:421, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (473:482, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (204:212, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (750:757, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (533:540, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (754:762, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (342:349, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (271:278, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (735:743, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (164:172, 4%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (319:326, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (443:450, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (404:411, <1%) - server/text_generation_server/layers/gptq/quantize.py (504:511, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (708:715, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (651:658, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (276:284, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (176:184, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (998:1005, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (404:411, <1%) - server/text_generation_server/layers/gptq/quantize.py (448:455, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (934:941, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (355:362, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (404:411, <1%) - server/text_generation_server/layers/gptq/quantize.py (546:553, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:625, <1%) - server/text_generation_server/models/__init__.py (1049:1056, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (320:327, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (74:81, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (111:118, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (474:482, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (413:421, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (122:130, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (284:292, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (319:326, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (738:746, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (447:455, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (66:73, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (72:79, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (393:402, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (473:482, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (161:169, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (84:92, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (453:461, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (516:524, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (378:386, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (637:645, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (209:217, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (256:263, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (346:353, 2%) - server/text_generation_server/adapters/lora.py (389:396, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (507:516, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (544:553, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (346:353, 2%) - server/text_generation_server/adapters/lora.py (352:359, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/lora.py (346:353, 2%) - server/text_generation_server/adapters/lora.py (377:384, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (385:392, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (174:182, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (162:170, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (237:245, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (374:381, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (643:650, <1%) - server/text_generation_server/models/__init__.py (1262:1270, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (30:37, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (111:118, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (385:392, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (835:842, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (255:262, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (256:263, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (342:350, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (643:650, <1%) - server/text_generation_server/models/__init__.py (1674:1682, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (392:399, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (358:368, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (369:379, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (443:450, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (590:597, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (421:428, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (416:423, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (171:179, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (141:148, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (503:510, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (545:552, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (264:272, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:230, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (477:485, <1%) - server/text_generation_server/models/idefics_causal_lm.py (87:95, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (114:121, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (71:78, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (381:388, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (83:93, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (166:176, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (314:322, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (689:696, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (693:700, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (192:199, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (180:187, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (453:461, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (525:533, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (194:202, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (284:292, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (328:336, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (471:480, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:313, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (439:448, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (437:446, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (197:204, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (381:390, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (405:414, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (355:362, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (370:377, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1055:1063, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (266:274, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (113:120, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (130:137, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (447:454, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (359:367, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (84:92, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (332:340, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (253:260, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (216:223, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (384:392, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (403:410, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (381:390, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (392:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (387:394, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (320:327, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (448:455, <1%) - server/text_generation_server/layers/gptq/quantize.py (372:379, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (145:153, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (156:164, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (400:407, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (448:455, <1%) - server/text_generation_server/layers/gptq/quantize.py (404:411, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (400:407, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (228:235, 1%) - server/text_generation_server/models/causal_lm.py (213:220, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (749:760, 1%) - server/text_generation_server/models/idefics_causal_lm.py (743:754, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (94:105, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (39:50, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (448:455, <1%) - server/text_generation_server/layers/gptq/quantize.py (504:511, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (479:486, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (353:362, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (369:378, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (219:227, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (72:80, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (284:292, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (426:433, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (271:278, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (400:407, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (535:542, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (381:388, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (257:264, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (302:310, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (250:258, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (316:323, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:283, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (172:180, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (284:292, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (266:274, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (484:492, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (708:715, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (768:775, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (394:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (455:462, 1%) - server/text_generation_server/layers/fp8.py (325:332, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (381:390, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (402:411, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:562, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (564:574, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (192:200, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (343:351, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (216:223, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (708:715, <1%) - server/text_generation_server/models/__init__.py (1143:1150, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (1228:1235, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (596:603, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (273:280, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (390:397, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (768:775, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (546:553, <1%) - server/text_generation_server/layers/gptq/quantize.py (372:379, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (541:548, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (392:399, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (515:523, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (754:762, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1369:1376, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (151:158, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (738:746, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (433:441, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:583, <1%) - server/text_generation_server/models/__init__.py (816:823, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (140:147, 4%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (57:64, 8%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (369:376, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (226:233, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (546:553, <1%) - server/text_generation_server/layers/gptq/quantize.py (504:511, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (574:581, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (546:553, <1%) - server/text_generation_server/layers/gptq/quantize.py (404:411, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (381:390, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (457:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/hub.py (36:43, 4%) - server/text_generation_server/models/__init__.py (594:601, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (469:476, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (538:545, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (423:430, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (1444:1451, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (30:37, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (128:135, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (1374:1381, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (608:615, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:792, <1%) - server/text_generation_server/models/__init__.py (1340:1347, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:571, <1%) - server/text_generation_server/models/__init__.py (1408:1415, <1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (346:354, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:253, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (180:190, 1%) - server/text_generation_server/models/causal_lm.py (176:186, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (705:712, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (411:418, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (363:370, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (274:281, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (459:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (197:204, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (390:397, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (377:384, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (371:378, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (618:625, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (319:326, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (324:332, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (319:326, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (429:436, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (381:390, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (437:446, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (722:729, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (575:584, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (558:567, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (696:704, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (395:403, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (313:320, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (366:373, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (808:815, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (552:559, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (412:421, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (457:466, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (347:354, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (353:362, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (405:414, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (62:69, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (188:195, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (394:401, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (439:448, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (473:482, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (164:172, 4%) - server/text_generation_server/models/custom_modeling/idefics3.py (477:485, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (332:340, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (208:216, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (85:93, 2%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (353:361, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1507:1514, <1%) - server/text_generation_server/models/transformers_flash_causal_lm.py (219:226, 3%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (123:133, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (80:90, 2%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (420:427, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (643:650, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (583:592, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (544:553, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (398:407, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (406:415, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (424:431, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (483:490, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (502:509, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (473:480, 1%) 8 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (332:340, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (384:392, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (174:181, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (647:654, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (223:231, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (180:186, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (34:42, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (31:38, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (265:272, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (98:106, <1%) - server/text_generation_server/models/causal_lm.py (94:102, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (34:41, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (33:40, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (256:262, 1%) - server/text_generation_server/layers/rotary.py (579:585, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (737:743, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (503:509, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (375:381, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (417:423, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (434:440, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (304:312, 1%) - server/text_generation_server/layers/gptq/__init__.py (223:231, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (279:287, 1%) - server/text_generation_server/models/custom_modeling/clip.py (288:296, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1359:1365, <1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/adapter.py (81:87, 3%) - server/text_generation_server/utils/adapter.py (129:135, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (457:464, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (576:583, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (946:953, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (375:382, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (409:416, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (484:490, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (723:729, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (166:172, <1%) - server/text_generation_server/models/galactica.py (147:153, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:65, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:292, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (209:216, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (484:490, 1%) - server/text_generation_server/layers/fp8.py (206:212, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (79:85, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (57:63, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:859, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:636, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (408:415, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2465:2471, <1%) - server/text_generation_server/models/mamba.py (775:781, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (359:365, <1%) - server/text_generation_server/models/__init__.py (425:431, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (1017:1023, <1%) - server/text_generation_server/models/flash_causal_lm.py (1182:1188, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (516:523, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (407:416, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (417:426, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (470:476, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (209:216, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (209:216, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:859, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (210:217, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:636, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (484:490, 1%) - server/text_generation_server/layers/fp8.py (308:314, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/exl2.py (59:66, 14%) - server/text_generation_server/layers/compressed_tensors/wna16_int_24.py (47:54, 9%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (303:310, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (95:101, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:431, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (671:677, 1%) - server/text_generation_server/models/transformers_flash_vlm.py (580:586, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (246:253, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (102:108, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (124:130, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (180:187, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:203, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (480:486, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (766:772, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (251:258, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (269:276, 3%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (946:953, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (554:560, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (411:417, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (102:108, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (83:90, 7%) - server/text_generation_server/models/custom_modeling/idefics3.py (547:554, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (306:313, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (820:827, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (782:789, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (448:455, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (172:178, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (59:65, 1%) - server/text_generation_server/layers/rotary.py (46:52, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (249:256, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (658:664, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (524:532, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (536:544, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (256:263, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (611:617, <1%) - server/text_generation_server/models/idefics_causal_lm.py (591:597, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (172:178, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (127:135, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (141:149, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (180:187, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (569:575, <1%) - server/text_generation_server/models/transformers_flash_causal_lm.py (129:135, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (898:904, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (766:772, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (95:101, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (279:285, <1%) - server/text_generation_server/models/mamba.py (262:268, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (33:39, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (59:65, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (920:927, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (797:804, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (102:108, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:731, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (455:462, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:321, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (180:186, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (898:904, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (580:586, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (34:41, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (33:40, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1399:1405, <1%) - server/text_generation_server/models/seq2seq_lm.py (581:587, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1942:1948, <1%) - server/text_generation_server/models/mllama_causal_lm.py (258:264, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (185:191, 6%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (201:207, <1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (528:534, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (478:484, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (479:485, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:215, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (575:581, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (155:162, 1%) - server/text_generation_server/layers/marlin/gptq.py (108:115, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (647:654, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (480:486, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (500:507, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (797:804, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (516:523, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (98:106, <1%) - server/text_generation_server/models/idefics_causal_lm.py (112:120, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (478:484, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (166:172, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (300:306, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (258:264, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (238:245, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (15:22, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (32:39, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (147:153, 1%) - server/text_generation_server/layers/gptq/__init__.py (242:248, 1%) 7 duplicated lines in: - backends/neuron/server/text_generation_server/cli.py (18:49, 11%) - server/text_generation_server/cli.py (52:58, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (618:624, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (561:567, <1%) - server/text_generation_server/models/causal_lm.py (540:546, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (238:245, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:229, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (183:189, 5%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (306:313, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (147:153, 1%) - server/text_generation_server/layers/gptq/__init__.py (311:317, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (396:403, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (671:677, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (479:485, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/speculate.py (1:11, 100%) - server/text_generation_server/utils/speculate.py (1:11, 100%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (202:209, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (181:188, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (1049:1055, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (404:411, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (351:359, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (852:858, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (243:251, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (347:354, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (57:63, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (88:105, 1%) - server/text_generation_server/utils/logits_process.py (152:167, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (185:192, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (116:122, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (998:1004, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (216:223, 2%) - server/text_generation_server/models/custom_modeling/neox_modeling.py (384:391, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (958:964, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (554:560, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (329:335, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1359:1365, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (503:509, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (502:511, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (417:426, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (98:106, <1%) - server/text_generation_server/models/mamba.py (134:142, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (39:46, 3%) - server/text_generation_server/layers/moe/gptq_marlin.py (95:102, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (934:940, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (385:392, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (185:191, 6%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (448:455, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (155:162, 1%) - server/text_generation_server/layers/compressed_tensors/w8a8_int.py (76:83, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (563:570, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (782:789, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (852:858, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (584:590, 1%) - server/text_generation_server/layers/rotary.py (254:260, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (59:65, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (73:79, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (671:677, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (925:931, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (934:940, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (958:964, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (117:124, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (113:120, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (816:822, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (303:310, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (138:144, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (134:140, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (33:40, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (32:39, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:284, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:193, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (343:350, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (998:1004, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (355:361, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (209:216, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (404:410, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/idefics_config.py (300:306, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (945:951, <1%) - server/text_generation_server/models/mllama_causal_lm.py (258:264, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (246:253, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (372:378, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (348:354, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (516:523, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (193:200, 2%) - server/text_generation_server/models/custom_modeling/clip.py (264:271, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (702:709, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (223:230, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (127:135, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (99:107, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (214:220, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (214:220, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (303:310, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (248:254, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (624:630, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (111:117, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (219:225, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (385:392, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (127:135, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (143:151, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (131:137, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (167:173, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (816:822, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/idefics_config.py (300:306, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (210:217, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (739:746, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (396:403, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (352:361, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (297:305, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1399:1405, <1%) - server/text_generation_server/models/causal_lm.py (532:538, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1357:1363, <1%) - server/text_generation_server/models/__init__.py (1870:1876, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (180:186, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (60:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (697:704, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/layernorm.py (55:61, 16%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (116:122, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (347:354, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (407:416, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (564:573, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (262:268, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (816:822, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (128:136, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (141:149, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (81:88, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:308, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (315:322, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (149:156, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (60:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (300:306, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (258:264, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (966:972, <1%) - server/text_generation_server/server.py (317:323, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (920:927, <1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (946:953, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (166:172, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (766:772, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:815, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (111:118, 2%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (173:181, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (852:858, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (199:207, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (390:396, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (254:260, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (309:315, 2%) - server/text_generation_server/models/__init__.py (1819:1825, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (500:507, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (524:531, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (279:287, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (139:146, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (110:117, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (279:287, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (366:375, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (207:214, <1%) - server/text_generation_server/models/idefics_causal_lm.py (255:262, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (210:217, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (310:316, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (299:305, 1%) - server/text_generation_server/layers/compressed_tensors/w8a8_int.py (78:84, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (417:423, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (498:504, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (102:108, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (347:354, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1399:1405, <1%) - server/text_generation_server/models/transformers_flash_causal_lm.py (129:135, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (33:40, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (33:40, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (269:276, 3%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (310:316, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (367:374, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (315:322, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:611, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (396:403, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (235:241, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (254:260, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (39:47, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (36:43, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1359:1365, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (736:742, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (183:189, 5%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (357:364, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (597:603, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (486:492, 1%) - server/text_generation_server/models/mllama_causal_lm.py (258:264, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (172:179, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (181:188, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:611, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (187:195, 1%) - server/text_generation_server/layers/gptq/__init__.py (289:297, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (379:386, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (487:494, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (820:827, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (83:90, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (210:217, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (215:221, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (215:221, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (219:225, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (184:190, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (348:356, 1%) - server/text_generation_server/layers/rotary.py (301:307, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (934:940, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (217:223, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (175:181, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (958:964, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (133:140, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (204:212, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (998:1004, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (1049:1055, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (35:42, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (31:38, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/exl2.py (59:66, 14%) - server/text_generation_server/layers/compressed_tensors/w8a8_int.py (76:83, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2436:2442, <1%) - server/text_generation_server/models/causal_lm.py (776:782, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (246:253, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (1049:1055, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (230:236, 1%) - server/text_generation_server/layers/rotary.py (126:132, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (202:208, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (539:548, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (450:459, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (687:694, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (805:812, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:663, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (993:999, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (223:229, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (392:401, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (507:516, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (196:202, 1%) - server/text_generation_server/layers/gptq/__init__.py (169:175, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (265:272, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (621:628, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (347:354, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (398:405, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (500:507, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (946:953, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (79:86, 3%) - server/text_generation_server/layers/exl2.py (59:66, 14%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:663, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:308, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (34:41, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (32:39, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (186:193, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (187:194, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) - server/text_generation_server/models/custom_modeling/idefics2.py (818:825, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (114:120, 6%) - server/text_generation_server/layers/moe/fp8.py (96:102, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (378:384, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (196:202, 1%) - server/text_generation_server/layers/gptq/__init__.py (405:411, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (315:322, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (591:597, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (84:90, <1%) - server/text_generation_server/models/bloom.py (16:22, 23%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (404:410, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (205:212, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (58:68, <1%) - server/text_generation_server/models/mamba.py (91:101, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (695:701, <1%) - server/text_generation_server/models/__init__.py (1182:1188, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (251:258, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (251:258, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (638:645, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (79:86, 3%) - server/text_generation_server/layers/marlin/gptq.py (108:115, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (635:643, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (376:384, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (638:645, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (408:415, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (37:44, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (37:45, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (73:80, 3%) - server/text_generation_server/layers/moe/fp8.py (61:68, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (117:123, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (50:56, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (306:313, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (697:704, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (34:41, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (31:38, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (306:313, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:171, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (201:208, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (146:154, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (99:107, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:624, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (146:154, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (143:151, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (155:161, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (310:316, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (590:596, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (283:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (219:226, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (143:151, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (118:125, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (15:22, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (31:38, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (246:253, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (408:415, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (155:161, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/idefics_config.py (300:306, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (355:361, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (697:704, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (146:154, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (125:133, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (357:364, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (379:386, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (57:63, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (739:746, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (706:712, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (166:172, 3%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (925:931, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (966:972, <1%) - server/text_generation_server/cli.py (122:128, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (945:951, <1%) - server/text_generation_server/models/flash_causal_lm.py (1781:1787, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (935:942, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (1018:1025, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (281:290, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (450:459, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:154, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (401:410, 2%) - server/text_generation_server/models/custom_modeling/clip.py (605:616, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (920:927, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (560:567, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (563:570, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (83:90, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (198:204, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (81:87, 1%) - server/text_generation_server/layers/marlin/gptq.py (69:75, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (202:208, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (246:254, 1%) - server/text_generation_server/layers/gptq/__init__.py (223:231, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (364:370, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:779, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (357:364, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (386:392, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (576:582, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (251:258, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (60:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (234:240, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (448:454, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (95:101, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (262:268, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (89:95, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (50:56, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (234:240, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (755:762, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (155:162, 1%) - server/text_generation_server/layers/exl2.py (59:66, 14%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:663, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (166:172, <1%) - server/text_generation_server/models/mamba.py (188:194, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:570, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (390:396, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (335:341, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/globals.py (42:52, 24%) - server/text_generation_server/models/globals.py (67:77, 13%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (60:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (139:145, 1%) - server/text_generation_server/layers/gptq/__init__.py (232:238, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (219:225, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (110:116, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (276:283, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (181:188, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (219:225, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (67:73, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/idefics_config.py (300:306, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (57:63, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (647:654, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (379:386, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (638:645, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (124:130, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (205:212, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:570, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (347:354, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (157:164, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (136:143, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (127:133, 1%) - server/text_generation_server/layers/rotary.py (228:234, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (544:550, 1%) - server/text_generation_server/models/custom_modeling/clip.py (461:467, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (429:436, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (207:214, <1%) - server/text_generation_server/models/mamba.py (224:231, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (60:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (522:528, <1%) - server/text_generation_server/models/__init__.py (662:668, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (898:904, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (479:485, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (310:316, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (223:230, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:308, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:284, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:193, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (210:216, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (219:225, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (210:217, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (188:196, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) - server/text_generation_server/models/custom_modeling/idefics2.py (736:742, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (503:509, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (503:509, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (34:42, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (32:39, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (898:904, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (166:172, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (166:172, 3%) - server/text_generation_server/models/transformers_flash_vlm.py (580:586, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (214:220, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (343:350, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (57:63, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (308:315, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (487:494, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (1228:1234, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (209:216, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:815, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (573:579, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (266:272, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:859, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (621:628, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (209:216, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (379:386, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (155:161, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (183:189, 5%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (172:178, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (153:159, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (598:605, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (291:298, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:431, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (702:709, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (446:453, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:815, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (99:105, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (185:191, 6%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (591:597, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (833:840, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (946:953, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fused_moe.py (21:27, 7%) - server/text_generation_server/layers/moe/fused_moe_ipex.py (21:27, 17%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (227:235, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (1444:1450, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (1408:1414, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (1374:1380, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (188:196, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (469:477, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (590:598, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (457:464, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (605:616, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (401:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:897, <1%) - server/text_generation_server/models/__init__.py (1340:1346, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (202:208, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (79:86, 3%) - server/text_generation_server/layers/compressed_tensors/wna16_int_24.py (47:54, 9%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1274:1280, <1%) - server/text_generation_server/models/flash_causal_lm.py (1141:1147, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (223:230, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (53:59, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (65:71, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (79:86, 3%) - server/text_generation_server/layers/compressed_tensors/wna16_int.py (59:66, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2436:2442, <1%) - server/text_generation_server/models/idefics_causal_lm.py (804:810, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (183:189, 5%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (480:486, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (503:509, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/idefics_config.py (300:306, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (185:192, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:228, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (343:350, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (386:392, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (585:591, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (267:273, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (322:328, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (478:484, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (1228:1234, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (204:210, 2%) - server/text_generation_server/models/__init__.py (428:434, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/exl2.py (59:66, 14%) - server/text_generation_server/layers/marlin/gptq.py (108:115, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (65:74, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (57:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (861:867, <1%) - server/text_generation_server/models/mamba.py (775:781, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (43:49, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (73:79, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (500:507, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (560:567, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (333:340, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (609:615, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (193:200, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (180:187, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:211, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (647:654, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (227:235, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (621:628, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (202:208, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (57:63, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (539:548, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (507:516, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (57:63, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (503:509, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (638:645, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (73:79, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (161:167, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (264:270, 1%) - server/text_generation_server/layers/fp8.py (308:314, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (737:743, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (766:772, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (390:396, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (335:341, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (251:258, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (247:253, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (161:167, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (102:108, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (576:583, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (524:531, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (315:322, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (630:636, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (411:417, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:184, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:292, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1359:1365, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (479:485, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (357:364, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/cli.py (119:125, 2%) - server/text_generation_server/models/__init__.py (1819:1825, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (646:652, <1%) - server/text_generation_server/models/causal_lm.py (612:618, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (15:22, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (33:40, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:157, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:292, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) - server/text_generation_server/models/custom_modeling/llava_next.py (166:172, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (124:130, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (60:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (262:268, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (1340:1346, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (60:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (833:840, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (205:212, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (208:215, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (147:154, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (1374:1380, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (1444:1450, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:598, <1%) - server/text_generation_server/models/__init__.py (1408:1414, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (84:90, <1%) - server/text_generation_server/models/galactica.py (64:70, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (79:85, 2%) - server/text_generation_server/layers/rotary.py (46:52, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (98:105, 2%) - server/text_generation_server/models/custom_modeling/clip.py (145:152, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (737:743, 1%) - server/text_generation_server/models/transformers_flash_vlm.py (580:586, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (347:354, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (99:107, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (171:179, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (333:340, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (198:204, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (193:200, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (185:191, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (254:260, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (193:200, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (238:245, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (35:42, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (12:19, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (366:372, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (364:370, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:197, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:292, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (236:243, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (658:664, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (343:350, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (618:624, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1942:1948, <1%) - server/text_generation_server/models/flash_causal_lm.py (1781:1787, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (486:492, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (514:520, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (198:204, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (294:300, 1%) - server/text_generation_server/layers/rotary.py (352:360, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1371:1377, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (334:340, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (144:152, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (171:179, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (379:386, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (97:107, <1%) - server/text_generation_server/models/__init__.py (144:154, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (54:60, 13%) - server/text_generation_server/utils/peft.py (16:22, 13%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1359:1365, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (580:586, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (343:350, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (755:762, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (180:187, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (91:98, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (220:227, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (559:567, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (455:463, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (58:68, <1%) - server/text_generation_server/models/causal_lm.py (54:64, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (312:319, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (265:272, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (262:268, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (755:762, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (333:340, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (524:531, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (223:230, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (357:364, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (448:455, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (155:161, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (220:227, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (33:40, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (32:41, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (166:173, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (223:231, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (231:237, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (607:613, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (315:322, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) - server/text_generation_server/models/transformers_flash_vlm.py (580:586, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (821:828, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (849:856, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (755:762, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (210:217, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (742:749, <1%) - server/text_generation_server/models/causal_lm.py (706:713, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (500:507, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (818:825, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:779, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (158:164, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (773:779, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (60:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (202:208, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (440:446, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:779, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1399:1405, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (190:196, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (621:628, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:803, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (457:465, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (590:598, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (180:187, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (220:227, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (236:243, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (208:214, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (139:146, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (154:161, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (215:221, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (244:250, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (697:704, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (457:464, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (739:746, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (34:41, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (33:40, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (122:128, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (67:73, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (630:636, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (329:335, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (739:746, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/merges/strategies.py (63:71, 4%) - server/text_generation_server/utils/merges/strategies.py (103:111, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (303:310, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (478:484, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (736:742, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (390:396, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (237:243, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/idefics_config.py (300:306, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (378:384, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (404:410, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (333:340, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (524:530, <1%) - server/text_generation_server/models/causal_lm.py (479:485, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (56:62, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (89:95, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (333:340, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (408:415, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (17:25, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (37:45, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (155:162, 1%) - server/text_generation_server/layers/compressed_tensors/wna16_int_24.py (47:54, 9%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (621:628, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (99:105, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (322:330, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (327:335, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (479:485, <1%) - server/text_generation_server/models/galactica.py (64:70, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/adapter.py (125:131, 3%) - server/text_generation_server/utils/adapter.py (81:87, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/adapter.py (125:131, 3%) - server/text_generation_server/utils/adapter.py (129:135, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (95:101, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (671:677, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (736:742, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/merges/strategies.py (103:111, 4%) - server/text_generation_server/utils/merges/strategies.py (63:71, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (457:464, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (128:136, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (143:151, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (269:276, 3%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (524:531, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (576:583, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (124:130, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (83:90, 7%) - server/text_generation_server/models/custom_modeling/idefics2.py (805:812, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (39:47, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (15:23, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:636, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (99:107, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (143:151, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (310:316, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (99:105, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (755:762, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:582, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (739:746, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (56:62, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (114:120, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (702:709, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (946:953, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (478:484, 1%) - server/text_generation_server/models/transformers_flash_vlm.py (580:586, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (99:107, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (125:133, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (569:575, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (190:196, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (166:172, 3%) - server/text_generation_server/layers/moe/fp8.py (94:100, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/layernorm.py (55:61, 16%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (118:124, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (336:343, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (326:333, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (72:79, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (181:188, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (198:204, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (56:62, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (131:137, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (275:281, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (585:591, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (878:884, <1%) - server/text_generation_server/models/__init__.py (1643:1649, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (670:676, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (245:252, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (737:743, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (214:220, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (215:221, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (326:332, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (303:310, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (920:927, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (818:825, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (34:41, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (13:20, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (303:310, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (697:704, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (205:212, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (379:386, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (185:191, 6%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (635:643, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (455:463, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (57:63, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (488:494, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (494:500, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (315:322, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:284, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:193, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (124:130, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (371:377, 1%) - server/text_generation_server/layers/fp8.py (206:212, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (153:159, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (474:480, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (448:455, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1376:1382, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (254:260, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (898:904, <1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (920:927, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (269:276, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (315:322, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (310:316, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (155:162, 1%) - server/text_generation_server/layers/compressed_tensors/wna16_int.py (59:66, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) - server/text_generation_server/models/custom_modeling/llava_next.py (269:276, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (371:377, 1%) - server/text_generation_server/layers/fp8.py (365:371, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (193:200, 2%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (285:292, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (248:254, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (254:260, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (146:154, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (141:149, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (241:248, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (210:217, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (697:704, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (660:666, <1%) - server/text_generation_server/models/mamba.py (466:472, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/merges/strategies.py (90:97, 4%) - server/text_generation_server/utils/merges/strategies.py (107:114, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (480:486, 1%) - server/text_generation_server/models/transformers_flash_vlm.py (580:586, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (28:37, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (57:66, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (262:268, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (315:323, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (243:251, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (431:437, 1%) - server/text_generation_server/layers/fp8.py (365:371, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:791, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (194:201, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (181:188, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (448:455, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (536:542, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (431:437, 1%) - server/text_generation_server/layers/fp8.py (206:212, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (155:162, 1%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (73:80, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:791, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (486:492, 1%) - server/text_generation_server/models/flash_causal_lm.py (1781:1787, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (64:70, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (54:60, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (516:523, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (667:673, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (524:530, <1%) - server/text_generation_server/models/mamba.py (389:395, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:284, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:136, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (95:101, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (128:136, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (99:107, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (220:227, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (390:396, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (306:312, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (279:285, <1%) - server/text_generation_server/models/causal_lm.py (265:271, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (480:486, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (925:931, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (165:171, <1%) - server/text_generation_server/models/seq2seq_lm.py (525:531, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (737:743, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (925:931, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (34:41, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (32:41, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (205:212, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (251:258, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (539:545, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/adapters/__init__.py (6:13, 100%) - server/text_generation_server/adapters/__init__.py (6:13, 100%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (638:645, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (77:83, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (59:65, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (153:159, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (516:523, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (448:454, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (739:746, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (575:581, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (203:211, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (137:144, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (155:162, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (136:143, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (795:802, 1%) - server/text_generation_server/models/custom_modeling/t5_modeling.py (991:998, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (536:542, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:134, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:292, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (254:260, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:308, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (183:189, 5%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (144:152, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (143:151, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (153:159, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (257:263, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (254:260, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (57:63, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:871, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (180:187, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (130:137, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (396:403, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (385:392, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (59:65, 7%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (696:703, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (375:381, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (56:62, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (133:139, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (142:150, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (220:227, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:871, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (169:175, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (183:189, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (113:119, 6%) - server/text_generation_server/layers/moe/fp8.py (161:167, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (559:567, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (376:384, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (238:245, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (34:41, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (32:41, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (671:677, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (166:172, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (180:186, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (243:251, 3%) - server/text_generation_server/layers/moe/fp8.py (158:166, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/layernorm.py (55:61, 16%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (74:80, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (310:316, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (153:159, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (155:161, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (136:142, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (50:56, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (262:268, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (755:762, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (797:804, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (333:340, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:803, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (124:130, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/idefics_config.py (300:306, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (412:418, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:197, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:292, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (223:230, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (172:179, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (181:188, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/merges/strategies.py (107:114, 4%) - server/text_generation_server/utils/merges/strategies.py (90:97, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (177:183, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (123:129, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (317:323, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (219:225, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:803, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (180:186, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (16:25, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (16:25, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (364:370, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (898:904, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (736:742, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (379:386, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (37:45, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (37:45, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (306:313, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (647:654, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (390:396, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (201:207, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) - server/text_generation_server/models/custom_modeling/idefics3.py (560:567, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (407:416, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (335:344, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (95:101, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (647:654, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (202:208, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (166:173, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (193:200, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (220:227, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (440:446, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (372:378, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (378:384, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (169:175, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (265:271, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (448:455, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (479:485, <1%) - server/text_generation_server/models/bloom.py (16:22, 23%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (172:178, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (169:175, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (375:381, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (43:49, 1%) - server/text_generation_server/layers/rotary.py (46:52, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (221:229, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (252:259, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (183:189, 5%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (385:392, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (508:515, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (166:172, <1%) - server/text_generation_server/models/causal_lm.py (163:169, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (99:105, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (243:250, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (1374:1380, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1359:1365, <1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (925:931, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (1444:1450, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (1408:1414, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (396:403, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2436:2442, <1%) - server/text_generation_server/models/mamba.py (726:732, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (457:464, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (706:712, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (247:253, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (110:116, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (185:191, 6%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (485:492, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (755:762, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (457:465, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (581:589, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (621:628, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (609:615, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:611, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (1340:1346, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (502:511, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (335:344, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (638:645, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (215:221, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (169:175, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (262:268, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (234:240, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (180:186, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:731, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:556, <1%) - server/text_generation_server/models/__init__.py (1228:1234, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (146:154, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (143:151, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:144, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (407:413, 1%) - server/text_generation_server/layers/gptq/__init__.py (232:238, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:731, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (60:69, <1%) - server/text_generation_server/models/__init__.py (99:108, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (559:567, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (489:497, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (134:140, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (50:56, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (216:222, 3%) - server/text_generation_server/layers/moe/unquantized.py (107:113, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (597:603, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) - server/text_generation_server/models/custom_modeling/idefics3.py (479:485, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (94:101, 7%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (946:953, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (34:41, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (13:20, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (35:42, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (33:40, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (315:322, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (223:230, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (408:415, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (348:355, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (396:403, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:207, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:624, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (742:749, <1%) - server/text_generation_server/models/mamba.py (656:663, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:308, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (484:490, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (251:258, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (343:350, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (234:240, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (31:41, <1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (40:47, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (502:508, <1%) - server/text_generation_server/models/__init__.py (696:702, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:624, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:308, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (611:617, <1%) - server/text_generation_server/models/mamba.py (409:415, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (379:386, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (219:226, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (187:194, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (648:654, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (539:545, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (238:245, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (139:146, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (152:159, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:871, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (60:69, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (25:34, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (671:677, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (503:509, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (16:22, 13%) - server/text_generation_server/utils/peft.py (54:60, 13%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (172:178, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (169:175, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (110:116, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (205:212, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (169:175, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (67:73, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (647:654, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (280:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (702:709, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (524:531, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (385:392, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (95:101, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (60:69, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (59:68, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (357:364, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (478:484, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (766:772, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (43:49, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (57:63, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (357:364, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (638:645, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (457:464, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (414:421, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/exl2.py (59:66, 14%) - server/text_generation_server/layers/compressed_tensors/wna16_int.py (59:66, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (281:290, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (507:516, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (183:189, 5%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (475:482, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (448:455, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (302:308, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (180:187, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (284:291, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (246:253, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (238:245, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (265:272, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (145:152, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (98:105, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (34:42, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (33:40, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (667:673, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (185:191, 6%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (739:746, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (110:116, <1%) - server/text_generation_server/models/idefics_causal_lm.py (123:129, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (500:507, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (269:276, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (183:189, 5%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (920:927, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (524:531, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (240:246, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (219:225, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (102:108, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (311:318, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (371:378, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1359:1365, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (166:172, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (333:340, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:505, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (687:694, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (547:554, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (209:216, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (206:212, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (245:252, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (925:931, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/idefics_config.py (300:306, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (265:272, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (144:150, 1%) - server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (516:523, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (306:313, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (185:191, 6%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (110:117, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (136:143, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (33:40, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (13:20, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (73:79, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (110:116, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (474:480, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (155:161, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (35:42, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (32:39, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (97:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (325:331, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (254:260, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (348:354, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (502:511, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (564:573, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (99:105, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (256:263, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (632:639, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (169:175, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (184:190, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (157:163, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (185:191, 6%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (503:509, 1%) - server/text_generation_server/models/custom_modeling/bloom_modeling.py (361:367, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (412:418, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (651:657, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (264:271, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (193:200, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (379:387, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (590:598, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (249:256, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (208:214, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (516:523, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (408:415, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (185:192, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (197:204, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (621:628, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (403:410, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (635:643, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (489:497, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (220:227, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (176:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (206:212, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (245:252, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (234:240, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (347:354, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (602:608, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (609:615, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (246:253, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (34:41, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (31:38, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (163:170, 2%) - server/text_generation_server/server.py (182:189, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (333:340, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (484:491, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (57:63, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (142:149, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (246:253, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (159:165, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (219:225, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (697:704, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (723:729, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (833:840, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (524:531, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (410:417, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (434:441, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (461:467, 1%) - server/text_generation_server/models/custom_modeling/clip.py (544:550, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (198:204, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (223:230, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:171, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (96:103, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (280:288, 1%) - server/text_generation_server/models/custom_modeling/clip.py (288:296, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (646:652, <1%) - server/text_generation_server/models/idefics_causal_lm.py (627:633, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (155:161, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (279:286, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (202:208, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (265:272, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (277:284, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (180:186, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (272:279, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (343:350, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (232:239, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (199:206, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:182, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (480:486, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (63:69, 1%) - server/text_generation_server/models/custom_modeling/idefics_config.py (300:306, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (220:227, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (247:254, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (258:265, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (306:313, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (275:281, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (576:582, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (122:128, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (161:167, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (469:477, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (581:589, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (122:128, 3%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (184:190, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (360:367, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (385:392, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (102:108, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (504:511, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (385:392, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:582, <1%) - server/text_generation_server/models/__init__.py (891:897, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (670:676, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (245:252, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (98:104, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (102:108, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (396:403, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (144:152, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (125:133, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:284, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:159, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:582, <1%) - server/text_generation_server/models/__init__.py (764:770, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (146:154, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (171:179, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (584:591, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (341:348, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (214:220, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:170, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:118, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1359:1365, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (766:772, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (182:188, 5%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (148:154, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:183, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (392:401, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (450:459, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (457:464, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (193:200, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (282:289, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (569:575, <1%) - server/text_generation_server/models/causal_lm.py (532:538, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/exl2.py (59:66, 14%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (73:80, 4%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (166:172, 3%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (503:509, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:791, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (523:529, <1%) - server/text_generation_server/models/seq2seq_lm.py (167:173, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:296, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (124:130, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (446:453, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (702:709, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:182, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:209, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (122:129, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (181:188, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (46:52, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (74:80, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (228:234, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:304, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (31:38, 6%) - server/text_generation_server/layers/moe/gptq_marlin.py (95:102, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:570, <1%) - server/text_generation_server/models/__init__.py (1612:1618, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:155, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (230:236, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (193:200, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (281:288, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:148, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:148, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (470:476, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (521:527, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (216:223, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (207:214, <1%) - server/text_generation_server/models/causal_lm.py (199:206, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (149:164, 1%) - server/text_generation_server/utils/logits_process.py (91:108, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (361:367, 1%) - server/text_generation_server/models/custom_modeling/bloom_modeling.py (503:509, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (33:40, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (33:40, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (39:47, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (35:43, 2%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (166:172, 3%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (67:73, 7%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (100:106, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (185:191, 6%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (494:500, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (480:486, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (569:575, <1%) - server/text_generation_server/models/flash_causal_lm.py (1232:1238, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (166:172, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (219:225, <1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (97:103, 1%) - server/text_generation_server/models/custom_modeling/mamba_modeling.py (62:68, 3%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (408:415, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (587:594, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (271:278, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (344:351, 1%) 7 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (379:387, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (581:589, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (121:128, 6%) - server/text_generation_server/models/custom_modeling/llava_next.py (298:303, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (348:354, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (359:365, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (235:243, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:156, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (142:147, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (481:486, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:183, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (205:211, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (173:179, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/types.py (20:25, 8%) - server/text_generation_server/models/bloom.py (17:22, 20%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (195:200, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (164:169, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (913:918, <1%) - server/text_generation_server/models/flash_causal_lm.py (641:646, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (487:492, 1%) - server/text_generation_server/models/vlm_causal_lm.py (1004:1009, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (460:466, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (383:389, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:64, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (274:279, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (515:520, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (541:546, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:169, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (190:195, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (502:507, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (647:652, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (191:196, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (157:162, 1%) - server/text_generation_server/layers/fp8.py (239:244, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (90:95, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (150:155, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (103:108, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (73:78, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/types.py (20:25, 8%) - server/text_generation_server/models/mamba.py (123:128, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (194:201, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/types.py (20:25, 8%) - server/text_generation_server/models/causal_lm.py (83:88, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (660:665, <1%) - server/text_generation_server/models/idefics_causal_lm.py (661:666, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (157:162, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (154:159, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (34:40, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (32:38, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (299:304, 1%) - server/text_generation_server/layers/gptq/__init__.py (193:198, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (576:581, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (77:82, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (193:198, 5%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (157:162, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (182:187, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (424:429, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (907:912, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (471:476, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (431:439, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (306:314, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (476:481, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (565:570, <1%) - server/text_generation_server/layers/gptq/quantize.py (521:526, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (386:391, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:291, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (39:44, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (34:39, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (600:605, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (298:303, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:135, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (922:927, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (378:383, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (36:42, <1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (38:44, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (149:156, <1%) - server/text_generation_server/models/idefics_causal_lm.py (204:211, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (88:93, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (659:664, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (547:552, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (726:732, <1%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (292:298, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (252:257, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (395:400, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (194:201, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (259:267, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (449:454, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (649:654, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (207:212, 2%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (314:320, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (428:436, 1%) - server/text_generation_server/utils/logits_process.py (265:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (958:963, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (998:1003, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (321:326, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (386:391, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (406:411, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (934:939, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (75:81, <1%) - server/text_generation_server/models/mamba.py (113:118, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (702:707, <1%) - server/text_generation_server/models/vlm_causal_lm.py (697:702, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (173:179, 2%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (189:195, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (283:289, 3%) - server/text_generation_server/models/custom_modeling/idefics3.py (578:583, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (578:583, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (1049:1054, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (114:120, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (175:181, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:227, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (57:62, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (203:208, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (152:157, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (75:80, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (75:81, <1%) - server/text_generation_server/models/idefics_causal_lm.py (80:85, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (217:223, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (372:378, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (764:769, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (570:575, <1%) - server/text_generation_server/models/causal_lm.py (613:618, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (267:272, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (270:275, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (400:405, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (129:134, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (60:65, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (259:267, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (35:41, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (36:42, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (816:821, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (194:199, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (155:160, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (182:187, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (90:95, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (143:148, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (852:857, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (293:298, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (350:355, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (891:896, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (293:298, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (378:383, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (591:596, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (286:291, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (565:570, <1%) - server/text_generation_server/layers/gptq/quantize.py (389:394, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (619:624, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (547:552, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (565:570, <1%) - server/text_generation_server/layers/gptq/quantize.py (421:426, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (464:469, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (177:182, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (138:143, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (118:123, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (203:208, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (454:459, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (454:459, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/loader.py (73:78, 5%) - server/text_generation_server/utils/weights.py (117:122, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (660:665, <1%) - server/text_generation_server/models/seq2seq_lm.py (610:615, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (207:212, 2%) - server/text_generation_server/models/custom_modeling/clip.py (288:294, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (803:810, <1%) - server/text_generation_server/models/flash_causal_lm.py (804:811, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (441:446, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (382:387, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (297:302, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (578:583, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (567:573, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:320, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (299:304, 1%) - server/text_generation_server/layers/marlin/marlin.py (58:63, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (725:730, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (294:302, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (440:448, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (121:128, 6%) - server/text_generation_server/models/custom_modeling/idefics2.py (847:852, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (270:275, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (647:652, <1%) - server/text_generation_server/models/flash_causal_lm.py (1233:1238, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (161:167, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (123:129, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1559:1564, <1%) - server/text_generation_server/models/flash_causal_lm.py (1507:1512, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (456:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:129, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (401:406, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (524:529, <1%) - server/text_generation_server/models/galactica.py (147:152, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (34:39, 1%) - server/text_generation_server/models/custom_modeling/clip.py (129:134, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (201:206, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (143:148, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (877:882, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (424:429, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (348:353, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (82:87, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (119:125, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (162:168, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (40:46, <1%) - server/text_generation_server/models/flash_causal_lm.py (47:53, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (986:991, <1%) - server/text_generation_server/models/mllama_causal_lm.py (259:264, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (451:456, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (40:46, <1%) - server/text_generation_server/models/idefics_causal_lm.py (14:23, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:156, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (271:276, 3%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (365:370, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (379:384, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (161:167, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (91:97, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (119:124, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (73:78, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (373:378, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (464:469, <1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (647:652, <1%) - server/text_generation_server/models/seq2seq_lm.py (582:587, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (389:394, <1%) - server/text_generation_server/layers/gptq/quantize.py (467:472, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (17:22, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (41:46, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (578:583, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (280:286, <1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (314:320, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (318:323, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (244:250, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (262:268, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (218:223, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (271:276, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (24:29, 11%) - server/text_generation_server/utils/peft.py (16:21, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (461:466, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (278:283, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (389:394, <1%) - server/text_generation_server/layers/gptq/quantize.py (565:570, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (598:603, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:209, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (339:345, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (825:831, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (194:199, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (235:243, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (528:533, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (352:358, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (371:377, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (78:83, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (342:347, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (748:755, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (298:303, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (144:149, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (86:92, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (82:88, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/quantization.py (143:148, 4%) - server/text_generation_server/utils/quantization.py (155:160, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (313:318, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (447:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (25:30, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (29:34, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/mllama_causal_lm.py (526:531, 1%) - server/text_generation_server/models/vlm_causal_lm.py (1004:1009, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:183, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (271:276, 3%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (456:462, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (419:425, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:156, <1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (968:973, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (152:157, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (247:252, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (270:275, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (187:192, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (209:214, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:209, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (531:537, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (523:528, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (922:927, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (837:842, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (596:605, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (549:558, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:183, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (26:31, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (9:14, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (623:629, <1%) - server/text_generation_server/models/causal_lm.py (604:610, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (188:195, 1%) - server/text_generation_server/layers/gptq/__init__.py (158:165, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (385:390, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (441:446, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (62:67, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (365:370, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (401:406, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (247:252, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (346:355, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (473:482, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (481:486, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (150:155, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (165:171, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (151:156, 4%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (193:198, 5%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (37:42, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (41:46, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (35:40, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (33:38, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (456:462, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (388:394, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (188:195, 1%) - server/text_generation_server/layers/gptq/__init__.py (394:401, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (443:448, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (187:192, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (659:664, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (173:179, 2%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (262:268, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (476:481, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (201:206, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (451:456, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (433:438, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (345:350, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (87:93, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (162:168, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (279:284, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (239:244, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (335:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (359:365, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (84:90, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (117:123, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (175:181, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (421:426, <1%) - server/text_generation_server/layers/gptq/quantize.py (467:472, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (85:90, <1%) - server/text_generation_server/models/types.py (20:25, 7%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (51:56, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (57:62, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (528:533, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (809:814, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (357:362, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:135, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (322:327, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (339:345, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (328:334, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (319:325, 2%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (825:831, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (490:497, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (65:70, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (140:145, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/linear.py (6:11, 23%) - server/text_generation_server/layers/eetq.py (28:33, 18%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/types.py (20:25, 8%) - server/text_generation_server/models/flash_causal_lm.py (473:478, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/lora.py (161:166, 3%) - server/text_generation_server/layers/lora.py (180:185, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (35:40, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (34:39, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:503, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (623:628, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (652:657, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1425:1430, <1%) - server/text_generation_server/models/mamba.py (455:460, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (69:74, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (115:120, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (111:117, 6%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (115:121, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (445:450, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (39:44, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (35:40, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (76:81, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (94:99, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (374:380, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (678:683, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (9:14, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (30:35, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (865:870, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (429:434, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (968:973, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (75:80, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (157:162, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (152:157, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (946:951, <1%) - server/text_generation_server/models/vlm_causal_lm.py (1004:1009, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (201:206, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:79, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (522:527, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (386:391, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (373:378, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (259:267, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (361:367, 1%) - server/text_generation_server/models/custom_modeling/neox_modeling.py (385:391, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (414:419, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (372:377, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (289:296, <1%) - server/text_generation_server/models/vlm_causal_lm.py (280:287, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (385:390, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (398:403, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (399:404, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (15:21, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (32:38, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (103:108, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (80:85, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:135, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (753:758, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (708:713, <1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (1157:1162, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (183:189, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (241:247, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (683:688, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (907:912, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (543:548, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (334:339, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (156:162, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (241:247, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (62:67, 11%) - server/text_generation_server/utils/peft.py (24:29, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (668:674, 1%) - server/text_generation_server/models/custom_modeling/mpt_modeling.py (1089:1095, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (62:67, 11%) - server/text_generation_server/utils/peft.py (54:59, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:203, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (356:361, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (246:251, 2%) - server/text_generation_server/layers/moe/gptq_marlin.py (171:176, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (458:464, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (486:492, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (156:162, 1%) - server/text_generation_server/models/custom_modeling/clip.py (244:250, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (78:83, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (193:198, 5%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (421:426, <1%) - server/text_generation_server/layers/gptq/quantize.py (565:570, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (193:198, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (113:118, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (647:652, <1%) - server/text_generation_server/models/idefics_causal_lm.py (635:640, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (600:605, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (847:852, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (394:399, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (60:65, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (126:131, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (400:405, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (117:123, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:129, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (166:171, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (281:286, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (451:456, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (173:179, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (185:191, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (319:325, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (366:372, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (137:142, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (203:208, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (47:52, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (153:158, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (378:383, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (172:178, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (206:212, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (409:414, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (378:383, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (470:477, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (90:95, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (80:85, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (753:758, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (345:350, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (359:364, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (347:352, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (293:298, 3%) - server/text_generation_server/models/custom_modeling/idefics2.py (847:852, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (502:508, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (401:407, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (267:272, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (489:494, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (523:528, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (365:370, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (671:676, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (219:224, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (218:223, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (531:537, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (678:683, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (242:248, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (185:191, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (110:115, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (182:187, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (207:212, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (191:196, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (157:162, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (154:159, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (464:469, <1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (366:373, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (400:407, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (565:570, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (447:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (376:382, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (393:399, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (128:135, 1%) - server/text_generation_server/layers/gptq/__init__.py (224:231, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (341:349, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (266:272, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (353:359, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:183, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (402:407, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:183, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (835:840, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:158, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (293:298, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (780:785, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (300:307, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (351:358, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (761:766, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (78:83, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (90:95, <1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (528:533, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (476:481, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (34:41, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (32:38, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (724:729, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (400:405, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (259:264, 2%) - server/text_generation_server/cli.py (120:125, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (339:345, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (359:365, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (207:215, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:64, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (32:37, <1%) - server/text_generation_server/models/__init__.py (74:79, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (207:212, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:203, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/layernorm.py (34:40, 14%) - server/text_generation_server/layers/layernorm.py (77:83, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (319:325, 2%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (401:407, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (266:272, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (655:660, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (523:528, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (166:171, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (379:385, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/dist.py (49:55, 13%) - server/text_generation_server/utils/dist.py (65:71, 8%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (618:623, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (502:507, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (156:162, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (262:268, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:156, <1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (485:490, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (341:349, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (458:465, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (372:377, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (130:135, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (69:74, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/merges/strategies.py (114:121, 4%) - server/text_generation_server/utils/merges/strategies.py (73:80, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (383:388, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (207:215, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (288:294, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (207:212, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (166:171, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (357:362, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (263:269, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (208:214, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:283, <1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (246:251, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (378:383, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (447:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (247:252, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (345:350, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (431:436, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (406:411, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (521:526, <1%) - server/text_generation_server/layers/gptq/quantize.py (565:570, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (40:46, <1%) - server/text_generation_server/models/causal_lm.py (19:30, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:283, <1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (400:407, 1%) - server/text_generation_server/layers/rotary.py (490:497, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (76:81, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (94:99, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (359:365, 2%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (351:358, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (63:68, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (70:75, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:156, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (32:40, <1%) - server/text_generation_server/models/custom_modeling/t5_modeling.py (39:46, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (366:371, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (270:275, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (75:80, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (94:99, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:227, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (521:526, <1%) - server/text_generation_server/layers/gptq/quantize.py (467:472, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (244:250, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (189:195, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (554:559, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (587:594, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (386:392, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (480:485, <1%) - server/text_generation_server/models/types.py (20:25, 7%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (132:138, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (84:90, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (235:240, 2%) - server/text_generation_server/utils/weights.py (261:266, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (119:125, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (82:88, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (194:201, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (339:345, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (284:290, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (349:354, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (668:673, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (610:615, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (350:355, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (27:33, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (33:39, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (366:371, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (345:350, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (477:482, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (400:407, 1%) - server/text_generation_server/layers/rotary.py (251:258, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (485:490, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (281:287, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (306:312, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (240:246, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (616:622, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (35:40, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (35:40, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (547:552, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (348:353, <1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (193:198, 5%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (599:606, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (504:511, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (348:353, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (152:157, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (259:267, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (81:86, 2%) - server/text_generation_server/layers/gptq/__init__.py (193:198, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (461:466, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (502:507, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (416:421, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:336, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (386:391, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (748:755, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (590:595, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (582:587, <1%) - server/text_generation_server/models/causal_lm.py (559:564, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:169, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (190:195, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (409:414, 1%) - server/text_generation_server/models/transformers_flash_vlm.py (420:425, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:169, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (190:195, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (570:575, <1%) - server/text_generation_server/models/idefics_causal_lm.py (628:633, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (570:575, <1%) - server/text_generation_server/models/idefics_causal_lm.py (635:640, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (429:434, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (895:900, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (207:215, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (69:74, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (476:481, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (39:44, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (41:46, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/merges/strategies.py (73:80, 4%) - server/text_generation_server/utils/merges/strategies.py (114:121, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (166:171, <1%) - server/text_generation_server/models/mamba.py (389:394, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:133, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (656:662, <1%) - server/text_generation_server/models/custom_modeling/neox_modeling.py (102:108, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (464:469, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:503, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (452:457, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (115:120, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (547:552, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:291, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (352:358, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (340:346, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (9:14, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (26:31, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (773:778, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (657:662, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (177:182, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (400:405, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (275:280, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (371:376, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (284:290, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (183:189, <1%) - server/text_generation_server/models/custom_modeling/siglip.py (173:179, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (891:896, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/server.py (259:264, 2%) - server/text_generation_server/server.py (315:320, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:336, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (835:840, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (322:327, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (367:372, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (414:419, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (516:521, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (409:414, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (422:427, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (156:162, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (242:248, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (968:973, <1%) - server/text_generation_server/models/custom_modeling/clip.py (129:134, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:169, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (181:186, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:201, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (293:298, <1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (454:459, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:336, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (86:92, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (162:168, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:169, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (156:161, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (662:668, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (142:147, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (476:481, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (2457:2462, <1%) - server/text_generation_server/models/mamba.py (768:773, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (380:387, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (461:470, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (385:394, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (35:40, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (41:46, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (704:709, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (113:118, 5%) - server/text_generation_server/layers/moe/gptq_marlin.py (171:176, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (259:264, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (395:401, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (499:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (856:861, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (847:852, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (243:248, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:98, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (24:29, 11%) - server/text_generation_server/utils/peft.py (62:67, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (87:93, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (91:97, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (24:29, 11%) - server/text_generation_server/utils/peft.py (54:59, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (576:581, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (209:214, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (447:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (441:446, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (481:486, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (103:108, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (150:155, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (582:588, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (275:281, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (502:508, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (825:831, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (373:378, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:133, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (87:93, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (123:129, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (347:353, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (439:445, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (628:633, <1%) - server/text_generation_server/models/flash_causal_lm.py (900:905, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (365:370, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (348:353, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (299:304, 1%) - server/text_generation_server/layers/marlin/gptq.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1400:1405, <1%) - server/text_generation_server/models/seq2seq_lm.py (661:666, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (336:341, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (374:380, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (523:528, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (235:243, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (99:106, 1%) - server/text_generation_server/layers/gptq/__init__.py (327:334, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (494:502, <1%) - server/text_generation_server/models/seq2seq_lm.py (474:482, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1037:1043, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (242:248, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (155:160, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (154:159, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (185:190, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (113:118, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (13:19, <1%) - server/text_generation_server/models/flash_causal_lm.py (14:20, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (252:257, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (280:285, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (968:973, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (153:158, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (85:91, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (84:90, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (40:46, <1%) - server/text_generation_server/models/mamba.py (20:28, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (628:633, <1%) - server/text_generation_server/models/flash_causal_lm.py (641:646, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (477:482, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (35:41, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (38:44, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (853:858, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (537:542, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (78:83, 1%) - server/text_generation_server/models/custom_modeling/clip.py (129:134, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:304, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (345:350, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (522:527, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (542:547, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (387:392, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (600:605, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (590:595, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (578:583, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (195:200, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (409:414, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1037:1043, <1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (262:268, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (241:247, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (189:195, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (273:278, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:129, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (504:509, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (454:459, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (399:404, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (562:567, <1%) - server/text_generation_server/models/idefics_causal_lm.py (619:624, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:158, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (305:310, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (34:40, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (32:40, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (138:143, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (110:115, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (477:482, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (85:90, 1%) - server/text_generation_server/models/custom_modeling/gemma3/configuration_gemma3.py (193:198, 5%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (130:138, 2%) - server/text_generation_server/layers/fp8.py (289:297, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (139:144, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (55:60, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (139:144, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (66:71, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (151:156, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (166:171, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (379:385, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (177:182, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (528:533, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (361:367, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (224:230, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (90:95, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (80:85, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:304, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (835:840, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (194:201, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (241:247, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (262:268, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:79, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (386:392, 2%) - server/text_generation_server/models/custom_modeling/clip.py (587:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (143:148, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (235:243, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (65:70, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (60:65, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (125:130, 4%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (65:70, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (414:419, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (525:530, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (34:40, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (33:39, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (753:758, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (270:275, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (489:494, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (439:445, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (856:861, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (298:303, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (400:405, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/types.py (20:25, 8%) - server/text_generation_server/models/seq2seq_lm.py (87:92, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (425:430, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:158, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (152:157, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (60:65, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (259:267, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (534:540, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (495:501, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (86:92, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (84:90, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (69:74, 2%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (528:533, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (83:88, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (94:99, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (592:597, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (161:167, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (123:129, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (847:852, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (578:583, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (157:162, 1%) - server/text_generation_server/layers/marlin/marlin.py (58:63, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:169, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (225:230, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (340:346, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (366:372, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (293:298, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (378:383, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (396:401, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (461:466, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (437:442, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (619:624, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (520:529, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (558:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (495:500, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:201, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:98, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (610:615, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (235:242, 1%) - server/text_generation_server/layers/fp8.py (152:159, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (449:454, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (307:313, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/exl2.py (61:66, 12%) - server/text_generation_server/layers/marlin/marlin.py (58:63, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (610:615, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:227, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (161:166, 1%) - server/text_generation_server/layers/rotary.py (149:154, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:183, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (201:206, 2%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (295:311, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (148:154, 2%) - server/text_generation_server/models/transformers_flash_causal_lm.py (52:57, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (167:174, 1%) - server/text_generation_server/layers/fp8.py (76:83, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (652:657, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (33:39, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (32:38, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (183:189, <1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (262:268, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (171:177, 1%) - server/text_generation_server/models/transformers_flash_causal_lm.py (52:57, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (311:317, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (518:524, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (207:215, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (118:123, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (528:533, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (645:650, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (259:267, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (341:349, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (157:162, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (110:115, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (194:201, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (592:597, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (348:353, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (82:87, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (396:401, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:64, 2%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (293:298, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (395:400, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (99:106, <1%) - server/text_generation_server/models/galactica.py (77:84, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (154:160, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (152:157, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (439:444, <1%) - server/text_generation_server/layers/gptq/quantize.py (538:543, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (271:276, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (373:378, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:304, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (270:275, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:129, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/types.py (20:25, 8%) - server/text_generation_server/models/idefics_causal_lm.py (90:95, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (400:405, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/attention/kv_cache.py (170:175, 4%) - server/text_generation_server/layers/attention/kv_cache.py (243:248, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:283, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (65:70, 2%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (118:123, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (454:459, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (363:368, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (447:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (36:42, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (36:42, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (151:156, 4%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (342:347, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (87:93, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (84:90, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (242:248, <1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (262:268, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (132:138, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (353:359, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/lora.py (174:179, 3%) - server/text_generation_server/layers/lora.py (167:172, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (161:167, 4%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (84:90, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (85:91, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (91:97, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (195:200, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (203:208, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (922:927, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (268:273, 2%) - server/text_generation_server/utils/weights.py (228:233, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (395:400, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (87:93, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (82:88, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (348:353, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (397:402, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (145:151, 1%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (178:184, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (293:298, 3%) - server/text_generation_server/models/custom_modeling/llava_next.py (298:303, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (288:293, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (286:291, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (797:802, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (502:507, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (704:709, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (578:583, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (591:596, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (835:840, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (366:371, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (356:361, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (138:143, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (154:159, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (273:278, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (485:490, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (35:41, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (32:38, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (726:732, <1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (374:379, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (449:454, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (181:186, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (476:481, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (65:70, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (62:67, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:201, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:203, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/mlp.py (242:248, 2%) - server/text_generation_server/layers/medusa.py (97:103, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (271:276, 3%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:183, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (271:276, 3%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (153:158, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (75:80, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (368:373, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (742:748, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (78:83, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (152:157, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (279:285, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (314:320, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (524:529, <1%) - server/text_generation_server/models/causal_lm.py (163:168, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/exl2.py (61:66, 12%) - server/text_generation_server/layers/gptq/__init__.py (193:198, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (476:481, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/attention/kv_cache.py (99:104, 4%) - server/text_generation_server/layers/attention/kv_cache.py (232:237, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (502:507, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (385:390, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (59:64, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (126:131, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (899:904, <1%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (742:747, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (630:635, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (9:18, 2%) - server/text_generation_server/models/custom_modeling/clip.py (12:20, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (90:95, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (73:78, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:283, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (252:257, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (350:355, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (877:882, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (683:688, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (138:143, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (152:157, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:64, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (467:472, <1%) - server/text_generation_server/layers/gptq/quantize.py (421:426, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (922:927, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (467:472, <1%) - server/text_generation_server/layers/gptq/quantize.py (389:394, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (293:298, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (280:285, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (252:257, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (378:383, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (121:128, 6%) - server/text_generation_server/models/custom_modeling/idefics3.py (590:595, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (704:709, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (467:472, <1%) - server/text_generation_server/layers/gptq/quantize.py (521:526, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (83:88, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (94:99, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:183, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (899:904, <1%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (807:812, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (253:260, 1%) - server/text_generation_server/layers/rotary.py (401:408, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (270:275, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (77:82, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (342:347, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (350:355, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:201, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (207:213, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (264:270, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (598:603, <1%) - server/text_generation_server/models/seq2seq_lm.py (674:679, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (386:391, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (129:134, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (75:80, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (154:159, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (253:260, 1%) - server/text_generation_server/layers/rotary.py (490:497, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (78:83, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (153:158, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (476:481, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (207:215, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (295:300, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (219:224, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (528:535, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (558:564, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (406:411, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (293:298, 3%) - server/text_generation_server/models/custom_modeling/idefics3.py (590:595, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (69:74, 2%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (51:56, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (39:44, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (33:38, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (252:257, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (780:785, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (145:151, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (556:562, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (12:20, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (9:18, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (922:927, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (806:813, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (532:539, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (578:583, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (63:68, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (113:118, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (385:390, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (397:402, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (34:40, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (32:38, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (258:263, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (386:391, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (647:652, <1%) - server/text_generation_server/models/causal_lm.py (533:538, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (598:603, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (724:729, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (531:537, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (439:445, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (451:456, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (780:785, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (20:27, <1%) - server/text_generation_server/models/__init__.py (49:57, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (935:941, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (541:546, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (130:136, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (443:448, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (464:469, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:98, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (201:206, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (134:139, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (464:469, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (291:296, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (704:709, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (443:448, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:64, 2%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (540:545, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (37:42, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (41:46, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:79, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (335:340, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (110:115, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (154:159, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/exl2.py (61:66, 12%) - server/text_generation_server/layers/fp8.py (239:244, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (36:41, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (37:42, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (252:257, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (454:459, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (357:362, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (85:90, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (342:347, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (166:171, <1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (455:460, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (433:438, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (409:414, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (381:386, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (359:365, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (123:129, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (365:370, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (835:840, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (322:327, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (212:217, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (87:93, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (123:129, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (65:70, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (70:75, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (348:354, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (436:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (359:365, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (123:129, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (108:113, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (181:186, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (166:171, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (396:401, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (524:529, <1%) - server/text_generation_server/models/mamba.py (188:193, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (331:336, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (341:349, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (75:80, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (94:99, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (335:340, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (87:93, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (84:90, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (34:40, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (33:39, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (194:201, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fp8.py (246:251, 2%) - server/text_generation_server/layers/moe/unquantized.py (137:142, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (30:35, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (9:14, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (491:497, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (314:320, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (371:376, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (359:365, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (853:858, <1%) - server/text_generation_server/models/mamba.py (768:773, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (137:142, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (143:148, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (406:411, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (655:660, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (439:445, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (153:158, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (60:65, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (228:236, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (489:494, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (447:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (441:446, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (177:182, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (69:74, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (1228:1233, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:291, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (379:384, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (134:139, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (835:840, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (1374:1379, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (707:712, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (1444:1449, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (400:405, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (502:507, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (1408:1413, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (103:108, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (80:85, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (120:125, 2%) - server/text_generation_server/utils/weights.py (32:37, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (299:304, 1%) - server/text_generation_server/layers/exl2.py (61:66, 12%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (374:380, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (439:445, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (34:40, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (13:19, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (244:250, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (185:191, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (242:248, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (189:195, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (1340:1345, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1037:1043, <1%) - server/text_generation_server/models/custom_modeling/clip.py (244:250, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (90:95, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (203:208, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (225:233, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (119:125, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (84:90, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (376:381, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (195:200, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (142:147, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (515:520, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (936:941, <1%) - server/text_generation_server/models/__init__.py (1612:1617, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (281:286, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (201:206, <1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (51:56, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (548:555, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (791:798, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (922:927, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (34:40, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (31:37, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (279:284, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (394:399, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (86:92, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (353:359, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (255:260, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (373:378, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (414:419, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (348:353, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (117:122, <1%) - server/text_generation_server/models/custom_modeling/gemma3/processing_gemma3.py (105:110, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (396:401, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (138:143, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (207:215, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (829:834, <1%) - server/text_generation_server/models/transformers_flash_vlm.py (420:425, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (439:446, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (377:384, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (34:40, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (32:38, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (276:281, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (107:112, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (117:122, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (591:596, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (596:601, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (36:41, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (37:42, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (166:171, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (781:786, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (545:550, <1%) - server/text_generation_server/models/transformers_flash_causal_lm.py (100:105, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (396:401, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (259:267, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (835:840, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (550:555, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (489:496, 1%) - server/text_generation_server/layers/rotary.py (251:258, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:209, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (78:83, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (209:214, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (769:776, <1%) - server/text_generation_server/models/idefics_causal_lm.py (759:766, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (347:355, <1%) - server/text_generation_server/models/idefics_causal_lm.py (394:402, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (254:259, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (219:224, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (335:340, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (47:52, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (152:157, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (130:135, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (174:179, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (489:496, 1%) - server/text_generation_server/layers/rotary.py (401:408, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (178:183, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (414:419, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (266:271, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (299:304, 1%) - server/text_generation_server/layers/compressed_tensors/wna16_int.py (61:66, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (140:145, 2%) - server/text_generation_server/layers/compressed_tensors/w8a8_int.py (114:119, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (379:384, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (344:349, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (93:98, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (578:583, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (506:511, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (598:603, <1%) - server/text_generation_server/models/causal_lm.py (648:653, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/rotary.py (150:155, 1%) - server/text_generation_server/layers/rotary.py (160:165, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (142:147, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (696:702, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (475:480, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (570:575, <1%) - server/text_generation_server/models/seq2seq_lm.py (661:666, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/fused_moe.py (118:123, 6%) - server/text_generation_server/layers/moe/gptq_marlin.py (315:320, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (119:125, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (353:359, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (341:349, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (704:709, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (365:370, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (246:251, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (397:402, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:169, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (132:138, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (290:297, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (326:333, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (78:83, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (659:664, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (373:378, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (166:171, <1%) - server/text_generation_server/models/causal_lm.py (479:484, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (809:814, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (125:130, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (85:91, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (123:129, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:158, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (85:91, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (123:129, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (335:340, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llava_next.py (271:276, 3%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (479:484, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (619:624, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (608:613, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (579:584, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (400:405, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (704:709, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1610:1615, <1%) - server/text_generation_server/models/flash_causal_lm.py (1587:1592, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (137:142, 1%) - server/text_generation_server/models/custom_modeling/idefics_modeling.py (528:533, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1037:1043, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (241:247, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (77:82, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (426:431, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (355:360, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (336:341, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (428:433, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/medusa.py (97:103, 4%) - server/text_generation_server/layers/mlp.py (242:248, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (522:527, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (339:345, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (401:407, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (587:592, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (477:482, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (176:181, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (108:113, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (189:194, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (154:160, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:133, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (191:196, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (1037:1043, <1%) - server/text_generation_server/models/custom_modeling/siglip.py (173:179, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (647:652, <1%) - server/text_generation_server/models/transformers_flash_causal_lm.py (130:135, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:133, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (352:360, 1%) - server/text_generation_server/layers/compressed_tensors/w8an_fp.py (118:126, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (69:74, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (90:95, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics3.py (241:247, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (185:191, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (487:492, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/__init__.py (396:403, 1%) - server/text_generation_server/layers/gptq/__init__.py (224:231, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (389:394, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:169, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (209:214, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (856:861, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (590:595, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (598:603, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (299:304, 1%) - server/text_generation_server/layers/compressed_tensors/wna16_int_24.py (49:54, 8%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (199:204, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (299:304, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (335:340, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (472:480, <1%) - server/text_generation_server/models/seq2seq_lm.py (496:504, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (222:227, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (173:180, <1%) - server/text_generation_server/models/custom_modeling/mllama.py (788:794, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (370:375, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (380:385, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/fp8.py (175:182, 1%) - server/text_generation_server/layers/fp8.py (100:107, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_vlm_causal_lm.py (986:991, <1%) - server/text_generation_server/models/flash_causal_lm.py (1782:1787, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:133, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (126:134, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:133, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (273:278, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/siglip.py (73:78, 2%) - server/text_generation_server/models/custom_modeling/clip.py (119:124, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (543:548, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (187:192, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (368:373, 1%) - server/text_generation_server/models/custom_modeling/phi_modeling.py (292:298, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (120:125, 2%) - server/text_generation_server/layers/compressed_tensors/loader.py (78:83, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (458:463, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (328:334, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (90:95, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (125:130, 4%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (56:61, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (425:430, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (87:93, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (353:359, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (349:354, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (362:367, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (57:62, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (143:148, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (461:466, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (347:353, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (678:683, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (865:870, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (16:21, 11%) - server/text_generation_server/utils/peft.py (62:67, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (16:21, 11%) - server/text_generation_server/utils/peft.py (24:29, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (280:285, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (34:39, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (153:158, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (704:709, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (196:201, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/linear.py (6:11, 23%) - server/text_generation_server/layers/linear.py (48:53, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (314:319, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (395:400, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (395:400, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (345:350, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (278:283, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (273:278, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (270:275, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (347:353, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (523:528, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (112:117, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (605:610, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (113:118, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (198:203, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (511:516, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (441:446, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (502:507, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (416:422, <1%) - server/text_generation_server/models/causal_lm.py (347:353, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (203:208, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (540:545, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (132:138, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (82:88, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (699:704, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (386:391, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (311:317, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (527:533, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (498:503, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (535:540, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (260:265, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (589:594, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (371:376, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (328:334, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:135, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (266:271, 2%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:79, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (475:480, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (316:321, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (219:224, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (359:364, 1%) - server/text_generation_server/models/custom_modeling/opt_modeling.py (484:489, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (301:308, <1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (351:358, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (461:466, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (345:350, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/w8an_fp.py (81:86, 2%) - server/text_generation_server/layers/marlin/marlin.py (58:63, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (359:365, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (91:97, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/bloom_modeling.py (846:852, <1%) - server/text_generation_server/models/custom_modeling/neox_modeling.py (771:777, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (540:545, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (54:59, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (140:145, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (443:448, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (34:39, 1%) - server/text_generation_server/models/custom_modeling/idefics3.py (152:157, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/logits_process.py (266:273, 1%) - server/text_generation_server/utils/logits_process.py (427:435, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (904:909, <1%) - server/text_generation_server/models/__init__.py (1641:1646, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (464:469, <1%) - server/text_generation_server/models/custom_modeling/idefics3.py (562:567, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (69:74, 2%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (143:148, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (748:755, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (847:852, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (450:455, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (191:198, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (25:30, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (25:30, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/moe/unquantized.py (44:49, 5%) - server/text_generation_server/layers/moe/fp8.py (56:61, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (950:955, <1%) - server/text_generation_server/server.py (230:235, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (335:340, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (483:488, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1645:1650, <1%) - server/text_generation_server/models/flash_causal_lm.py (1526:1531, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (178:183, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (336:341, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (547:552, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (416:421, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (252:257, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (378:383, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (348:353, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (75:80, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (215:223, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (547:552, 1%) - server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (948:953, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (217:222, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (209:214, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (62:67, 11%) - server/text_generation_server/utils/peft.py (16:21, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (132:138, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (162:168, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (235:243, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/types.py (20:25, 8%) - server/text_generation_server/models/galactica.py (65:70, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (801:807, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (393:399, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (183:189, <1%) - server/text_generation_server/models/custom_modeling/clip.py (244:250, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (445:450, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (35:40, <1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (37:42, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (477:482, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (496:501, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (486:491, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (47:52, 1%) - server/text_generation_server/models/custom_modeling/clip.py (129:134, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (250:258, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (235:243, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (123:128, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (222:227, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (201:206, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (90:95, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (235:243, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (397:402, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (357:362, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (348:354, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (469:476, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (183:189, <1%) - server/text_generation_server/models/custom_modeling/idefics2.py (242:248, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (341:349, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:209, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (231:237, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (100:106, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (103:109, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (232:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (328:336, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (256:264, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (207:212, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (219:224, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (164:169, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (135:140, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (349:354, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (69:74, 2%) - server/text_generation_server/models/custom_modeling/mllama.py (203:208, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (240:245, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (395:400, <1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (270:275, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (413:418, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (368:373, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (194:202, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (545:550, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/gptq/quantize.py (538:543, <1%) - server/text_generation_server/layers/gptq/quantize.py (439:444, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (207:212, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1400:1405, <1%) - server/text_generation_server/models/idefics_causal_lm.py (635:640, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1400:1405, <1%) - server/text_generation_server/models/idefics_causal_lm.py (628:633, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (341:349, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (30:35, 2%) - server/text_generation_server/layers/compressed_tensors/loader.py (78:83, 4%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (671:676, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (191:196, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (336:341, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (307:313, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (353:359, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (464:469, <1%) - server/text_generation_server/models/custom_modeling/llava_next.py (271:276, 3%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (118:123, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (143:148, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (129:135, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (357:362, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (289:294, 1%) - server/text_generation_server/models/custom_modeling/idefics2.py (820:825, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (660:665, <1%) - server/text_generation_server/models/causal_lm.py (573:578, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1943:1948, <1%) - server/text_generation_server/models/vlm_causal_lm.py (1004:1009, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1990:1995, <1%) - server/text_generation_server/models/vlm_causal_lm.py (1004:1009, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (328:334, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (353:359, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (54:59, 11%) - server/text_generation_server/utils/peft.py (62:67, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (332:340, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/clip.py (288:294, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (314:320, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/peft.py (54:59, 11%) - server/text_generation_server/utils/peft.py (24:29, 11%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (149:154, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (94:99, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (262:270, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (412:417, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (437:442, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (396:401, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (510:515, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_moe_modeling.py (149:154, 4%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (94:99, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (217:222, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (659:664, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/layers/compressed_tensors/loader.py (73:78, 5%) - server/text_generation_server/utils/weights.py (32:37, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (433:438, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (270:275, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (182:187, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (153:158, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (190:195, 2%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (447:452, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (204:209, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (110:115, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (69:74, 2%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (134:139, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (74:79, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (620:625, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (75:81, <1%) - server/text_generation_server/models/causal_lm.py (73:78, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_vl.py (156:162, 1%) - server/text_generation_server/models/custom_modeling/siglip.py (173:179, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (386:391, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (201:206, <1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (115:120, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/qwen2_5_vl.py (922:927, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (381:386, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_moe_modeling.py (518:523, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (632:637, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (392:397, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/idefics2.py (835:840, <1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (652:657, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (724:729, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (416:421, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (741:746, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (231:236, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (290:298, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (35:40, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (37:42, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (127:133, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (183:188, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/seq2seq_lm.py (598:603, <1%) - server/text_generation_server/models/mamba.py (466:471, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (810:815, <1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (658:663, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (946:951, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (127:132, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (175:180, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (373:378, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (315:320, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (356:361, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (553:558, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (88:93, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (209:214, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (387:392, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (150:155, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (365:370, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (35:40, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (36:41, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (351:356, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (462:467, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (327:335, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (640:645, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/flash_causal_lm.py (1400:1405, <1%) - server/text_generation_server/models/causal_lm.py (613:618, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (566:571, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (663:668, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (200:208, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (299:307, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (682:687, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (25:30, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (25:30, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (416:421, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (539:544, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (630:635, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (245:250, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (310:315, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (336:341, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (548:553, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (489:494, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (678:683, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (757:762, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (540:545, <1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (572:577, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (178:186, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (194:201, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (242:249, <1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (207:215, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (415:420, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (702:707, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (785:790, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (680:685, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/utils/weights.py (30:35, 2%) - server/text_generation_server/utils/weights.py (117:122, 2%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (383:388, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (174:179, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (294:299, 2%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (475:480, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/__init__.py (564:569, <1%) - server/text_generation_server/models/__init__.py (1703:1708, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (290:295, 1%) - server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (206:211, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (318:326, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (239:244, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (286:291, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (273:278, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (345:350, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (135:140, 1%) - server/text_generation_server/models/custom_modeling/mllama.py (203:208, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (195:200, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (298:303, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (500:505, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (149:154, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (510:515, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (362:367, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_qwen3_modeling.py (59:64, 2%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (240:245, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (288:296, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (159:167, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:129, 1%) - server/text_generation_server/models/custom_modeling/idefics_vision.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (642:647, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (410:415, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (205:213, 1%) - server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (265:273, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mllama.py (916:921, <1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (522:527, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (35:40, <1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (15:20, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_starcoder2_modeling.py (586:591, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (588:593, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (36:41, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (41:46, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (547:552, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (799:804, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (255:263, 1%) - server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (230:238, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (398:403, 1%) - server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (454:459, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_santacoder_modeling.py (431:436, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (398:403, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (682:687, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (576:581, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (416:421, 1%) - server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (410:415, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (353:358, 1%) - server/text_generation_server/models/custom_modeling/flash_neox_modeling.py (405:410, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (369:374, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma3_modeling.py (393:398, <1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (597:602, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (114:120, 1%) - server/text_generation_server/models/custom_modeling/flash_phi_modeling.py (113:119, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (9:14, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (26:31, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (436:441, 1%) - server/text_generation_server/models/custom_modeling/flash_gemma2_modeling.py (533:538, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_deepseek_v2_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_cohere_modeling.py (458:463, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (195:200, 1%) - server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (177:182, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (547:552, 1%) - server/text_generation_server/models/custom_modeling/flash_pali_gemma_modeling.py (96:101, 6%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gpt2_modeling.py (377:382, 1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (343:348, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (459:464, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (451:456, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_mistral_modeling.py (124:129, 1%) - server/text_generation_server/models/custom_modeling/flash_gptj_modeling.py (132:137, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (968:973, <1%) - server/text_generation_server/models/custom_modeling/flash_qwen2_modeling.py (60:65, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama4_modeling.py (839:844, <1%) - server/text_generation_server/models/custom_modeling/qwen2_vl.py (526:531, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_rw_modeling.py (623:628, 1%) - server/text_generation_server/models/custom_modeling/flash_deepseek_v3_modeling.py (649:654, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_llama_modeling.py (223:231, 1%) - server/text_generation_server/models/custom_modeling/flash_mixtral_modeling.py (264:272, 1%) 6 duplicated lines in: - backends/gaudi/server/text_generation_server/models/custom_modeling/flash_dbrx_modeling.py (402:407, <1%) - server/text_generation_server/models/custom_modeling/flash_gemma_modeling.py (335:340, 1%)