path # lines of code # active days days since first update days since last update # commits # contributors first updated last updated first contributor last contributor bazel/bundle.bzl 519 1 504 504 1 1 2023-12-28 2023-12-28 xinfeishi@gmail.com xinfeishi@gmail.com bazel/pyc_wheel.py 129 1 504 504 1 1 2023-12-28 2023-12-28 xinfeishi@gmail.com xinfeishi@gmail.com bazel/defs.bzl 251 11 504 31 11 5 2023-12-28 2025-04-14 xinfeishi@gmail.com rtp-llm@alibaba bazel/arch_select.bzl 121 2 504 489 2 2 2023-12-28 2024-01-12 xinfeishi@gmail.com liukan.lk@alibaba-inc.com bazel/upload_package.py 48 1 504 504 1 1 2023-12-28 2023-12-28 xinfeishi@gmail.com xinfeishi@gmail.com bazel/tf_http_archive.bzl 260 1 182 182 1 1 2024-11-14 2024-11-14 rtp-llm@alibaba rtp-llm@alibaba bazel/tf_proto.bzl 398 2 394 213 2 1 2024-04-16 2024-10-14 rtp-llm@alibaba rtp-llm@alibaba bazel/py_proto.bzl 41 1 119 119 1 1 2025-01-16 2025-01-16 rtp-llm@alibaba rtp-llm@alibaba workspace.bzl 12 2 504 342 2 2 2023-12-28 2024-06-07 xinfeishi@gmail.com rtp-llm@alibaba example/perf_test/defs.bzl 140 4 294 156 4 1 2024-07-25 2024-12-10 rtp-llm@alibaba rtp-llm@alibaba open_source/bazel/arch_select.bzl 121 38 489 8 43 4 2024-01-12 2025-05-07 liukan.lk@alibaba-inc.com rtp-llm@alibaba def.bzl 193 14 504 287 16 5 2023-12-28 2024-08-01 xinfeishi@gmail.com rtp-llm@alibaba benchmark/benchmark_serving.py 223 1 470 470 1 1 2024-01-31 2024-01-31 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/metrics/kmonitor_metric_reporter.py 48 11 511 37 11 2 2023-12-21 2025-04-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/metrics/__init__.py 5 2 504 259 2 2 2023-12-28 2024-08-29 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/device/__init__.py 30 3 296 71 3 1 2024-07-23 2025-03-05 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/device/device_impl.py 305 14 296 66 15 3 2024-07-23 2025-03-10 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/device/device_base.py 40 7 296 71 7 1 2024-07-23 2025-03-05 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/distribute/worker_info.py 253 34 504 22 35 3 2023-12-28 2025-04-23 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/distribute/gang_info.py 137 13 504 25 14 2 2023-12-28 2025-04-20 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/distribute/gang_server.py 267 21 511 29 21 2 2023-12-21 2025-04-16 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/distribute/gang_test_util.py 40 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/start_frontend_server.py 31 3 72 37 3 1 2025-03-04 2025-04-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/pipeline/pipeline.py 256 57 504 22 72 3 2023-12-28 2025-04-23 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/pipeline/__init__.py 1 1 493 493 1 1 2024-01-08 2024-01-08 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/pipeline/default_plugin.py 44 6 444 144 6 1 2024-02-26 2024-12-22 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/pipeline/chatapi_format.py 38 3 504 419 3 2 2023-12-28 2024-03-22 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/pipeline/pipeline_custom_func.py 35 2 444 72 2 1 2024-02-26 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/async_decoder_engine/async_model.py 62 34 511 25 40 3 2023-12-21 2025-04-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/async_decoder_engine/backend_rpc_server_visitor.py 24 2 72 25 2 1 2025-03-04 2025-04-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/async_decoder_engine/engine_creator.py 26 23 511 8 23 2 2023-12-21 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/async_decoder_engine/embedding/embedding_engine.py 47 16 349 133 18 1 2024-05-31 2025-01-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/async_decoder_engine/embedding/interface.py 30 6 349 178 6 1 2024-05-31 2024-11-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/async_decoder_engine/base_engine.py 25 6 323 90 6 1 2024-06-26 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/async_decoder_engine/rpc_engine.py 50 14 323 35 15 1 2024-06-26 2025-04-10 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/grpc_util.py 51 1 154 154 1 1 2024-12-12 2024-12-12 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/mm_process_engine.py 52 17 330 154 19 1 2024-06-19 2024-12-12 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/util.py 163 21 504 46 21 2 2023-12-28 2025-03-30 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/utils/oss_util.py 15 1 309 309 1 1 2024-07-10 2024-07-10 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/nccl_util.py 9 1 402 402 1 1 2024-04-08 2024-04-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/token_processor.py 110 4 261 140 4 1 2024-08-27 2024-12-26 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/word_util.py 84 7 504 147 7 2 2023-12-28 2024-12-19 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/utils/tokenizer_utils.py 119 3 504 344 3 2 2023-12-28 2024-06-05 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/utils/database.py 126 21 442 8 22 1 2024-02-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/tensor_utils.py 9 1 380 380 1 1 2024-04-30 2024-04-30 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/complete_response_async_generator.py 32 1 436 436 1 1 2024-03-05 2024-03-05 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/thread_safe_deque.py 33 1 437 437 1 1 2024-03-04 2024-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/gemm_utils/device_map.py 58 3 325 90 3 1 2024-06-24 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/gemm_utils/__init__.py 6 2 325 90 2 1 2024-06-24 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/gemm_utils/cutlass_config.py 46 6 351 8 6 1 2024-05-29 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/ft_plugin.py 51 3 504 283 3 2 2023-12-28 2024-08-05 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/utils/dump_config_utils.py 25 3 493 218 3 2 2024-01-08 2024-10-09 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/utils/check_util.py 21 1 170 170 2 1 2024-11-26 2024-11-26 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/multimodal_util.py 94 17 323 72 17 2 2024-06-26 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/smooth_quant_convert/llama/hf_llama_convert.py 290 1 392 392 1 1 2024-04-18 2024-04-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/smooth_quant_convert/llama/smoothquant.py 150 1 392 392 1 1 2024-04-18 2024-04-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/smooth_quant_convert/llama/convert.py 191 1 392 392 1 1 2024-04-18 2024-04-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/smooth_quant_convert/qwen/smoothquant.py 158 1 389 389 1 1 2024-04-21 2024-04-21 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/smooth_quant_convert/qwen/convert.py 207 1 389 389 1 1 2024-04-21 2024-04-21 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/smooth_quant_convert/qwen/hf_qwen_convert.py 304 1 389 389 1 1 2024-04-21 2024-04-21 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/smooth_quant_convert/qwen/utils.py 122 1 389 389 1 1 2024-04-21 2024-04-21 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/concurrency_controller.py 53 3 504 44 3 2 2023-12-28 2025-04-01 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/utils/model_weight.py 1001 92 511 7 109 2 2023-12-21 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/export_utils.py 19 1 420 420 1 1 2024-03-21 2024-03-21 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/fuser.py 178 5 489 121 5 2 2024-01-12 2025-01-14 liukan.lk@alibaba-inc.com rtp-llm@alibaba maga_transformer/utils/weight_type.py 37 3 337 199 3 1 2024-06-12 2024-10-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/meta_pickler.py 234 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/utils/time_util.py 34 2 504 199 2 2 2023-12-28 2024-10-28 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/utils/lru_dict.py 27 5 504 322 5 2 2023-12-28 2024-06-27 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/utils/ckpt_file_info.py 155 7 371 8 7 1 2024-05-09 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/import_util.py 11 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/utils/flash_attn_utils.py 6 1 199 199 1 1 2024-10-28 2024-10-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/utils/version_info.py 13 1 511 511 1 1 2023-12-21 2023-12-21 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen2_vl/qwen2_vl_vit.py 175 9 234 143 9 1 2024-09-23 2024-12-23 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen2_vl/activations.py 113 1 234 234 1 1 2024-09-23 2024-09-23 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen2_vl/image_processing_qwen2_vl.py 270 2 234 183 2 1 2024-09-23 2024-11-13 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen2_vl/modeling_qwen2_vl.py 271 4 234 199 4 1 2024-09-23 2024-10-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen2_vl/qwen2_vl.py 152 11 234 8 11 1 2024-09-23 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/whisper.py 95 14 328 149 15 1 2024-06-21 2024-12-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/bloom.py 120 10 504 8 10 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/eva2clip_vit.py 165 9 330 183 11 1 2024-06-19 2024-11-13 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen_vl_vit.py 291 16 477 247 23 1 2024-01-24 2024-09-10 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/cogvlm2.py 184 25 335 149 38 1 2024-06-14 2024-12-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/jina_bert/jina_bert_weight.py 115 4 301 8 4 1 2024-07-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/jina_bert/jina_bert.py 27 2 301 300 2 1 2024-07-18 2024-07-19 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/minicpmv/modeling_navit_siglip.py 566 2 248 233 2 1 2024-09-09 2024-09-24 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/minicpmv/resampler.py 565 1 248 248 1 1 2024-09-09 2024-09-09 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/minicpmv/minicpmv.py 234 9 248 8 10 1 2024-09-09 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/chat_glm_v4_vision_weight.py 17 6 330 90 6 1 2024-06-19 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/rotary_embedding/deepseek_rotary_embedding.py 169 1 73 73 1 1 2025-03-03 2025-03-03 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen_v3_moe.py 30 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/deepseek_v2.py 310 22 237 8 25 1 2024-09-20 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/sgpt_bloom_vector.py 61 2 504 447 2 2 2023-12-28 2024-02-23 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/glm_v2_weight.py 59 6 504 8 6 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/__init__.py 40 29 504 34 30 3 2023-12-28 2025-04-11 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/base_model.py 467 90 511 8 105 2 2023-12-21 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/deepseek_dequant.py 18 1 42 42 1 1 2025-04-03 2025-04-03 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/llava.py 158 49 504 59 58 2 2023-12-28 2025-03-17 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/cosyvoice_qwen.py 22 1 129 129 1 1 2025-01-06 2025-01-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/starcoder2.py 153 10 437 8 10 1 2024-03-04 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/llava_vit.py 750 28 477 135 29 1 2024-01-24 2024-12-31 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/bert.py 94 15 429 146 15 1 2024-03-12 2024-12-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/propose_model/propose_model.py 6 2 268 210 2 1 2024-08-20 2024-10-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/falcon.py 77 11 504 8 11 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/chat_glm_v4_vision.py 52 23 330 8 27 1 2024-06-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen_v2.py 194 40 449 8 44 1 2024-02-21 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/sgpt_bloom.py 56 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/models/multimodal/multimodal_mixin.py 202 20 311 8 21 1 2024-07-08 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/multimodal/multimodal_common.py 94 17 311 147 19 1 2024-07-08 2024-12-19 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/multimodal/multimodal_trt_engine.py 226 3 311 286 4 1 2024-07-08 2024-08-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/mixtral.py 113 19 479 8 19 1 2024-01-22 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/mpt.py 57 7 504 8 7 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/megatron_bert.py 28 3 367 154 3 1 2024-05-13 2024-12-12 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/llava_weight.py 18 10 504 8 10 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/internvl.py 89 8 260 72 8 1 2024-08-28 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/phi.py 63 11 504 8 11 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/qwen_v2_moe.py 69 12 386 8 12 1 2024-04-24 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/gpt_util/rms.py 27 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/models/gpt_util/prefix_encoder.py 28 2 504 493 2 1 2023-12-28 2024-01-08 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/models/cogvlm2_weight.py 187 7 335 8 7 1 2024-06-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/internvl_weight.py 117 4 260 8 4 1 2024-08-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/chat_glm_v4.py 18 6 337 8 6 1 2024-06-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/internvl_vit.py 555 8 260 183 8 1 2024-08-28 2024-11-13 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen_vl_weight.py 14 13 504 90 14 2 2023-12-28 2025-02-14 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/qwen_v2_audio/qwen_v2_audio.py 50 9 261 8 10 1 2024-08-27 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen_v2_audio/configuration_qwen2_audio.py 79 1 261 261 1 1 2024-08-27 2024-08-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen_v2_audio/modeling_qwen2_audio.py 315 1 261 261 1 1 2024-08-27 2024-08-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/qwen_v2_audio/processor.py 59 3 261 183 3 1 2024-08-27 2024-11-13 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/chat_glm_v2.py 92 14 504 210 14 2 2023-12-28 2024-10-17 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/qwen.py 209 37 504 8 39 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/qwen_vl.py 132 47 504 183 59 2 2023-12-28 2024-11-13 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/starcoder.py 121 17 504 8 17 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/gpt_weight.py 40 4 504 8 4 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/gpt_neox_weight.py 106 5 504 8 5 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/downstream_modules/plugin_loader.py 22 1 380 380 1 1 2024-04-30 2024-04-30 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/__init__.py 8 5 380 146 5 1 2024-04-30 2024-12-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/embedding/all_embedding_module.py 56 10 367 149 10 1 2024-05-13 2024-12-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/embedding/misc.py 90 11 380 228 11 1 2024-04-30 2024-09-29 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/embedding/api_datatype.py 76 7 380 185 7 1 2024-04-30 2024-11-11 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/embedding/minicpmv_embedding_module.py 297 5 244 149 5 1 2024-09-13 2024-12-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/embedding/sparse_emebdding_module.py 71 5 380 149 5 1 2024-04-30 2024-12-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/embedding/bge_m3_embedding_module.py 73 2 228 176 2 1 2024-09-29 2024-11-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/embedding/dense_embedding_module.py 86 12 380 149 12 1 2024-04-30 2024-12-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/embedding/colbert_embedding_module.py 53 8 380 149 8 1 2024-04-30 2024-12-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/classifier/util.py 11 1 380 380 1 1 2024-04-30 2024-04-30 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/classifier/bert_classifier.py 55 3 288 118 3 1 2024-07-31 2025-01-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/classifier/api_datatype.py 10 2 380 359 2 1 2024-04-30 2024-05-21 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/classifier/roberta_classifier.py 33 3 380 118 3 1 2024-04-30 2025-01-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/classifier/classifier.py 45 9 380 118 9 1 2024-04-30 2025-01-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/reranker/reranker_module.py 52 6 359 146 7 1 2024-05-21 2024-12-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/reranker/api_datatype.py 19 3 359 183 3 1 2024-05-21 2024-11-13 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/utils.py 35 7 380 146 7 1 2024-04-30 2024-12-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/custom_module.py 48 12 380 118 12 1 2024-04-30 2025-01-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/downstream_modules/common_input_generator.py 43 8 380 140 8 1 2024-04-30 2024-12-26 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/llama.py 186 31 504 149 36 2 2023-12-28 2024-12-17 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/llava_utils.py 104 3 358 139 4 1 2024-05-22 2024-12-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/minicpmv_embedding/minicpmv_embedding.py 289 7 244 149 7 1 2024-09-13 2024-12-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/minicpmv_embedding/resampler.py 112 1 244 244 1 1 2024-09-13 2024-09-13 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/whisper_weight.py 64 3 328 8 3 1 2024-06-21 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/chat_glm_v3.py 24 10 504 8 10 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/bert_weight.py 127 10 429 8 10 1 2024-03-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/gpt_neox.py 115 12 504 210 12 2 2023-12-28 2024-10-17 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/models/megatron_bert_weight.py 84 4 367 8 4 1 2024-05-13 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/models/llama_weight.py 281 16 504 8 18 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/tools/fake_bloom.py 58 2 504 489 2 2 2023-12-28 2024-01-12 xinfei.sxf@alibaba-inc.com liukan.lk@alibaba-inc.com maga_transformer/tools/api/__init__.py 1 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/tools/api/model_basic_info_analyzer_api.py 33 2 170 112 2 1 2024-11-26 2025-01-23 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/api/utils.py 4 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/tools/api/model_size_evaluator_api.py 74 1 170 170 1 1 2024-11-26 2024-11-26 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/api/model_basic_info_analyzer.py 189 4 170 112 4 1 2024-11-26 2025-01-23 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/api/hf_model_helper.py 117 9 504 122 10 2 2023-12-28 2025-01-13 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/tools/__init__.py 1 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/tools/model_assistant_server.py 52 2 504 442 2 2 2023-12-28 2024-02-28 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/tools/convert/weights_convert.py 232 11 154 8 12 1 2024-12-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/quant/weights_quant.py 316 4 199 8 5 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/quant/__init__.py 10 1 199 199 1 1 2024-10-28 2024-10-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/quant/base_quanter.py 60 1 199 199 1 1 2024-10-28 2024-10-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/quant/fp8_quanter.py 217 1 199 199 1 1 2024-10-28 2024-10-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/quant/awq_quanter.py 31 1 199 199 1 1 2024-10-28 2024-10-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/quant/gptq_quanter.py 32 1 199 199 1 1 2024-10-28 2024-10-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/quant/datasets_adapter.py 82 2 199 8 2 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tools/fake_model_base.py 189 2 504 8 2 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/tools/fake_gpt_neox.py 62 2 504 489 2 2 2023-12-28 2024-01-12 xinfei.sxf@alibaba-inc.com liukan.lk@alibaba-inc.com maga_transformer/tools/log_analyze.py 69 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/tools/fake_qwen.py 73 4 504 281 4 3 2023-12-28 2024-08-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/tools/fake_glm_v2.py 63 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/tools/fake_util.py 20 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/__init__.py 46 10 504 91 12 4 2023-12-28 2025-02-13 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/lora/__init__.py 1 1 268 268 1 1 2024-08-20 2024-08-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/lora/lora_manager.py 70 3 268 8 3 1 2024-08-20 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/lora/lora_file.py 129 3 268 8 3 1 2024-08-20 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/lora/lora_weights.py 34 3 268 8 3 1 2024-08-20 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/start_backend_server.py 137 3 72 29 3 1 2025-03-04 2025-04-16 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/config/base_model_config.py 6 1 429 429 1 1 2024-03-12 2024-03-12 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/config/generate_config.py 182 42 504 18 51 2 2023-12-28 2025-04-27 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/config/gpt_init_model_parameters.py 641 94 493 7 113 2 2024-01-08 2025-05-08 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/config/exceptions.py 63 15 511 38 17 2 2023-12-21 2025-04-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/config/log_config.py 28 4 504 48 5 2 2023-12-28 2025-03-28 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/config/uvicorn_config.py 23 3 504 44 3 2 2023-12-28 2025-04-01 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/config/task_type.py 55 6 380 228 6 1 2024-04-30 2024-09-29 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/start_server.py 121 30 511 37 39 2 2023-12-21 2025-04-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/structure/request_extractor.py 169 14 451 80 14 1 2024-02-19 2025-02-24 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/embedding/embedding_endpoint.py 55 13 428 133 13 1 2024-03-13 2025-01-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/embedding/backend_embedding_app.py 39 1 72 72 1 1 2025-03-04 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/embedding/embedding_type.py 6 1 228 228 1 1 2024-09-29 2024-09-29 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/embedding/frontend_embedding_app.py 28 2 72 44 2 1 2025-03-04 2025-04-01 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tokenizer/tokenization_chatglm2.py 134 2 504 189 2 2 2023-12-28 2024-11-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/tokenizer/tokenization_chatglm4.py 135 1 189 189 1 1 2024-11-07 2024-11-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/tokenizer/tokenization_qwen.py 171 3 504 423 3 2 2023-12-28 2024-03-18 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/tokenizer/tokenization_chatglm.py 292 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/tokenizer/tokenization_chatglm3.py 229 5 504 189 6 2 2023-12-28 2024-11-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/model_loader/ffn_weight.py 230 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/weight_only_quant_weight.py 70 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/load_config.py 125 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/w8a8_weight.py 65 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/weight_module.py 430 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/__init__.py 10 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/model_weight_info.py 394 2 8 7 2 1 2025-05-07 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/omni_quant_weight.py 207 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/static_fp8_quant_weight.py 262 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/smooth_quant_weight.py 342 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/group_wise_quant_weight.py 256 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/loader.py 187 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/per_block_fp8_quant_weight.py 234 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/attn_weight.py 46 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_loader/per_tensor_int8_quant_weight.py 221 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderer_factory.py 63 7 471 287 8 1 2024-01-30 2024-08-01 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/chatglm4_renderer.py 88 4 337 283 5 1 2024-06-12 2024-08-05 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/llama_template.py 733 3 490 423 5 1 2024-01-11 2024-03-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent_renderer.py 222 10 316 147 12 1 2024-07-03 2024-12-19 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/__init__.py 17 9 471 76 9 1 2024-01-30 2025-02-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_renderer.py 453 38 493 38 42 3 2024-01-08 2025-04-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/llm/base.py 332 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/llm/qwenvl_dashscope.py 90 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/llm/qwen_dashscope.py 197 2 317 315 2 1 2024-07-02 2024-07-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/llm/function_calling.py 358 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/llm/__init__.py 36 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/llm/text_base.py 19 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/llm/openvino.py 118 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/llm/schema.py 92 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/llm/oai.py 99 1 317 317 2 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/settings.py 9 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/utils/__init__.py 1 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/utils/tool_function_converter/__init__.py 3 1 76 76 1 1 2025-02-28 2025-02-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/utils/tool_function_converter/response_converter.py 58 1 76 76 2 1 2025-02-28 2025-02-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/utils/tool_function_converter/request_converter.py 152 1 76 76 2 1 2025-02-28 2025-02-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/utils/parallel_executor.py 26 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/utils/str_processing.py 21 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/utils/utils.py 278 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/utils/tokenization_qwen.py 153 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/__init__.py 3 2 317 312 2 1 2024-07-02 2024-07-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent/log.py 17 1 317 317 1 1 2024-07-02 2024-07-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/internvl_renderer.py 151 5 258 139 6 1 2024-08-30 2024-12-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_vl_renderer.py 99 16 492 143 17 1 2024-01-09 2024-12-23 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/llava_renderer.py 150 18 490 135 19 1 2024-01-11 2024-12-31 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/basic_renderer.py 130 19 493 92 25 3 2024-01-08 2025-02-12 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/openai/renderers/qwen_agent_tool_renderer.py 65 2 76 73 5 1 2025-02-28 2025-03-03 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/fast_chat_renderer.py 42 3 482 423 5 1 2024-01-19 2024-03-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/minicpmv_renderer.py 84 2 248 231 2 1 2024-09-09 2024-09-26 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/custom_renderer.py 851 65 493 38 99 3 2024-01-08 2025-04-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/openai/renderers/cogvlm2_render.py 68 7 335 283 7 1 2024-06-14 2024-08-05 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/conversation.py 1228 4 482 258 4 1 2024-01-19 2024-08-30 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/llama_template_renderer.py 61 4 490 423 6 1 2024-01-11 2024-03-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/renderers/qwen_v2_audio_renderer.py 75 1 261 261 1 1 2024-08-27 2024-08-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/openai/openai_endpoint.py 249 65 504 65 75 3 2023-12-28 2025-03-11 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/openai/api_datatype.py 183 33 504 72 37 3 2023-12-28 2025-03-04 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/openai/renderer_factory_register.py 7 1 471 471 1 1 2024-01-30 2024-01-30 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/model_factory.py 213 35 511 7 37 3 2023-12-21 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/server/backend_server.py 207 7 72 8 7 1 2025-03-04 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/server/vit_rpc_server.py 51 1 154 154 1 1 2024-12-12 2024-12-12 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/server/backend_app.py 196 4 72 17 4 1 2025-03-04 2025-04-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/server/misc.py 66 7 380 133 8 1 2024-04-30 2025-01-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/server/frontend_server.py 253 6 72 17 6 1 2025-03-04 2025-04-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/server/frontend_app.py 163 3 72 25 3 1 2025-03-04 2025-04-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/server/frontend_worker.py 250 3 72 27 3 1 2025-03-04 2025-04-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/aios/kmonitor/python_client/flume/ttypes.py 92 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/aios/kmonitor/python_client/flume/__init__.py 1 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/aios/kmonitor/python_client/flume/pyflume.py 56 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/aios/kmonitor/python_client/flume/ThriftSourceProtocol.py 314 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/aios/kmonitor/python_client/kmonitor/metrics/metric_factory.py 14 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/aios/kmonitor/python_client/kmonitor/metrics/gauge_metric.py 19 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/aios/kmonitor/python_client/kmonitor/metrics/acc_metric.py 40 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/aios/kmonitor/python_client/kmonitor/metrics/metric_base.py 17 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/aios/kmonitor/python_client/kmonitor/utils/hippo_helper.py 36 2 504 199 2 2 2023-12-28 2024-10-28 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/aios/kmonitor/python_client/kmonitor/qps_metric.py 25 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/aios/kmonitor/python_client/kmonitor/kmonitor.py 38 2 504 408 2 2 2023-12-28 2024-04-02 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/aios/kmonitor/python_client/kmonitor/report_worker.py 94 4 504 192 4 3 2023-12-28 2024-11-04 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/eplb/ep_balancer.py 182 4 25 8 6 1 2025-04-20 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/eplb/eplb.py 108 2 25 20 2 1 2025-04-20 2025-04-25 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/plugins/ret_hidden_states.py 5 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/ops/rtp_llm/rtp_llm_op.py 38 16 394 35 17 1 2024-04-16 2025-04-10 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/ops/libth_transformer.pyi 407 9 90 7 9 1 2025-02-14 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/ops/__init__.py 52 19 504 25 21 3 2023-12-28 2025-04-20 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/ops/comm/parallel_op.py 44 2 402 380 2 1 2024-04-08 2024-04-30 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/ops/comm/nccl_op.py 25 8 504 8 8 2 2023-12-28 2025-05-07 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/model_factory_register.py 82 11 504 238 11 2 2023-12-28 2024-09-19 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/kserve_server.py 44 2 444 72 2 2 2024-02-26 2025-03-04 zibai.gj@alibaba-inc.com rtp-llm@alibaba maga_transformer/cpp/metrics/KmonParam.h 32 2 318 307 2 1 2024-07-01 2024-07-12 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/metrics/RtpLLMMetrics.h 394 28 369 25 28 1 2024-05-11 2025-04-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/metrics/KmonParam.cc 70 5 318 8 5 1 2024-07-01 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/metrics/RtpLLMMetrics.cc 360 34 369 8 36 1 2024-05-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/allocator_torch.h 38 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/Dispatch.h 208 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cuggemm/cuggemm.h 36 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cuggemm/cuggemm.cc 23 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/allocator_cuda.cc 145 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/ExpertAttentionUtil.h 180 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cuda_type_utils.cuh 378 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/allocator_torch.cc 39 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cuda_fp8_utils.h 189 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/trt_utils.h 107 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cuda_fmha_utils.h 162 2 8 7 2 1 2025-05-07 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cublas/cublas.h 3 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cublas/cublasAlgoMap.cc 163 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cublas/cublasFP8MMWrapper.h 144 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cublas/cublasAlgoMap.h 74 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cublas/cublasFP8MMWrapper.cc 882 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cublas/cublasMMWrapper.cc 912 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cublas/cublasMMWrapper.h 236 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/custom_ar/custom_ar_comm.cc 244 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/custom_ar/custom_ar_comm.h 50 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cuda_utils.h 416 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/reduce_kernel_utils.cuh 338 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cufmha/cufmha.h 149 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cufmha/cufmha.cc 440 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cufmha/fmha_profiling_interface.h 183 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/nccl/nccl_utils_torch.h 23 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/nccl/nccl_utils.cc 343 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/nccl/nccl_utils.h 85 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/nccl/nccl_utils_torch.cc 62 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/allocator_cuda.h 69 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/quantize_utils.h 93 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cuda_utils.cc 683 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cuda_bf16_fallbacks.cuh 277 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/comm_buffer/comm_buffer.cc 145 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/comm_buffer/comm_buffer.h 44 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/cuda_fp8_utils.cu 494 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/memory_utils.h 98 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/memory_utils.cu 753 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/ExpertAttentionUtil.cc 68 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/nvtx/kernel_profiler.h 28 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/nvtx/kernel_profiler.cc 39 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/nvtx/nvtx_utils.h 62 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cuda/nvtx/nvtx_utils.cc 74 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/ErrorCode.h 211 12 199 30 13 1 2024-10-28 2025-04-15 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/DFAUtil.h 79 3 56 51 3 1 2025-03-20 2025-03-25 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/utils.h 62 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/AtomicUtil.h 17 1 199 199 1 1 2024-10-28 2024-10-28 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/StringUtil.h 91 7 357 18 7 1 2024-05-23 2025-04-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/StackTrace.h 5 3 185 8 3 1 2024-11-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/activation_types.h 42 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/StackTrace.cc 31 4 185 8 4 1 2024-11-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/RopeConfig.h 44 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/layernorm_types.h 39 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/PyUtils.h 18 3 188 184 4 1 2024-11-08 2024-11-12 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/PyUtils.cc 60 3 188 184 3 1 2024-11-08 2024-11-12 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/Cm2Config.h 16 1 189 189 1 1 2024-11-07 2024-11-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/Logger.cc 86 2 188 64 2 1 2024-11-08 2025-03-12 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/quantization.h 215 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/StatusUtil.h 46 5 188 8 5 1 2024-11-08 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/LinearBiasUtil.h 52 3 321 8 3 1 2024-06-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/SignalUtils.cc 70 5 217 8 5 1 2024-10-10 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/PairUnorderedMap.h 31 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/ScopeGuard.h 21 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/EnumUtils.h 39 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/compiler_config.h 23 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/RpcErrorCode.h 85 1 163 163 1 1 2024-12-03 2024-12-03 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/Exception.h 23 1 188 188 1 1 2024-11-08 2024-11-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/QuantInfo.h 71 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/AttentionWeight.h 22 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/MlaConfig.h 10 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/SignalUtils.h 8 3 217 185 3 1 2024-10-10 2024-11-11 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/EplbConfig.h 9 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/TimeUtil.h 7 1 164 164 1 1 2024-12-02 2024-12-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/ShapeCheck.h 9 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/AssertUtils.h 37 3 188 8 3 1 2024-11-08 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/HashUtil.h 16 3 199 170 3 1 2024-10-28 2024-11-26 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/Logger.h 185 7 199 8 7 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/Exception.cc 53 1 188 188 1 1 2024-11-08 2024-11-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/ShapeCheck.cc 25 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/KVCacheUtils.h 10 1 189 189 1 1 2024-11-07 2024-11-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/LRUCache.h 82 2 394 346 2 1 2024-04-16 2024-06-03 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/utils/NetUtil.h 21 3 199 170 3 1 2024-10-28 2024-11-26 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/GptModel.h 211 68 422 8 78 1 2024-03-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/BaseLogitsProcessor.h 19 3 49 8 3 1 2025-03-27 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/GptModel.cc 1224 96 422 8 147 1 2024-03-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/BaseLogitsProcessor.cc 15 3 49 8 3 1 2025-03-27 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/MTPModel.h 14 2 34 8 2 1 2025-04-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/Sampler.h 22 20 422 8 24 1 2024-03-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/ThinkModeLogitsProcessor.cc 55 3 49 8 4 1 2025-03-27 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/SampleInfos.h 72 2 49 8 3 1 2025-03-27 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/MTPModel.cc 46 2 34 8 2 1 2025-04-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/ThinkModeLogitsProcessor.h 23 2 49 8 3 1 2025-03-27 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models/Sampler.cc 164 30 422 8 38 1 2024-03-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingStream.cc 79 9 374 8 10 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingEngine.h 40 11 388 8 11 1 2024-04-22 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/grpc/AllEmbeddingRpcServiceImpl.h 22 1 288 288 1 1 2024-07-31 2024-07-31 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/grpc/AllEmbeddingRpcServiceImpl.cc 29 2 288 8 2 1 2024-07-31 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingStream.h 54 10 374 8 11 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingQueryConverter.cc 37 6 374 8 6 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/handlers/LinearSoftmaxHandler.cc 58 9 363 8 10 1 2024-05-17 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/handlers/HandlerBase.h 32 8 374 8 8 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/handlers/LinearSoftmaxHandler.h 21 4 363 8 4 1 2024-05-17 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingQuery.h 64 9 374 8 9 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingScheduler.cc 64 5 374 8 5 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingExecutor.h 35 13 374 8 13 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/arpc/ArpcServerWrapper.h 15 1 288 288 1 1 2024-07-31 2024-07-31 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/arpc/ArpcServiceCreator.h 15 3 288 8 3 1 2024-07-31 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/arpc/ArpcServiceCreator.cc 15 3 288 8 3 1 2024-07-31 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/arpc/ArpcServerWrapper.cc 26 4 288 8 4 1 2024-07-31 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingExecutor.cc 232 25 374 8 27 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingScheduler.h 25 6 374 8 6 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingEngine.cc 82 19 388 8 20 1 2024-04-22 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingQueryConverter.h 15 4 374 231 4 1 2024-05-06 2024-09-26 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/embedding_engine/EmbeddingQuery.cc 33 6 374 8 6 1 2024-05-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/banRepeatNgram.h 20 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/ban_bad_words.h 19 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/quantize_weight.cu 141 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/gen_relative_pos_bias.h 37 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/unfused_attention_kernels.cu 2425 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/sampling_penalty_kernels.cu 607 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/penalty_types.h 23 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/gpt_kernels.h 252 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/no_aux_tc_kernels.cu 646 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/decoder_masked_multihead_attention_utils.h 2737 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/vec_dtypes.cuh 1229 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_mul.h 562 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/banRepeatNgram.cu 164 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/custom_ar_kernels.h 56 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_convert_from_float.h 71 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/activation_kernels.cu 711 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/sampling_topk_kernels.cu 575 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/logprob_kernels.h 16 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/activation_kernels.h 88 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/activation_fp8_kernels.cu 235 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/stop_criteria_kernels.h 22 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_logn_attention.h 99 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/stop_criteria_kernels.cu 138 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/quantization_tensor.cu 188 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_convert_from_fp8.h 96 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/hello_world.cu 29 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/rotary_position_embedding.h 720 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/layernorm_fp8_kernels.cu 998 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/sampling_topp_kernels.h 138 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/hello_world.h 11 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/unfused_attention_kernels.h 178 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/quantize_weight.h 15 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/kv_cache/kv_cache_index.h 36 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/kv_cache/kv_cache_utils.h 148 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/gpt_kernels.cu 1633 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/add_residual_kernels.cu 507 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/l1norm_kernels.cu 92 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/sampling_topp_kernels.cu 1458 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/layernorm_fp8_kernels.h 109 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_add.h 135 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_cast_to_int8.h 54 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/unfused_attention_fp8_kernels.cu 1012 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/gen_relative_pos_bias.cu 274 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/layernorm_kernels.h 48 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/activation_fp8_kernels.h 23 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/int8_utils.cuh 47 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_convert_to_fp8.h 63 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/alpha_layernorm_kernels.h 47 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/layernorm_kernels.cu 652 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/eplb/experts_stats_kernels.cu 126 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/eplb/experts_stats_kernels.h 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/sampling_penalty_kernels.h 74 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_sum_dot_zero.h 80 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/comm_buffer.h 45 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_vector_abs_max.h 38 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/sampling_topk_kernels.h 74 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/decoder_masked_multihead_attention/decoder_masked_multihead_attention.cu 286 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/decoder_masked_multihead_attention/decoder_masked_multihead_attention_launch.h 228 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/decoder_masked_multihead_attention/decoder_masked_multihead_attention_template.h 1663 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/decoder_masked_multihead_attention/decoder_masked_multihead_attention.h 149 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/logprob_kernels.cu 189 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/triton/layernorm_kernels.py 51 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/triton/aot_triton_kernel.bzl 252 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/triton/aot_triton_kernels_linker.py 38 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/triton/aot_triton_kernel_compiler.py 105 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/triton/layernorm_kernels.h 15 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/triton/layernorm_kernels.cu 82 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/l1norm_kernels.h 10 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/moe_topKSoftmax_kernels.h 71 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_fma.h 525 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/add_residual_kernels.h 84 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/mla_kernels/mla_merge_transpose_kernel.cu 169 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/mla_kernels/mla_merge_transpose_kernel.h 29 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/no_aux_tc_kernels.h 9 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/moe_topKSoftmax_kernels.cu 798 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/comm_buffer.cu 105 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/ban_bad_words.cu 148 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/_convert_to_float.h 75 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/unfused_attention_fp8_kernels.h 135 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/custom_ar_kernels.cu 387 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/quantization_tensor.h 15 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/alpha_layernorm_kernels.cu 766 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/rmsnormKernels.cu 443 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/rocm/quantization_rocm.cu 514 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/rocm/quantization_rocm.h 59 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/rocm/layernorm_kernels.h 63 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/rocm/layernorm_kernels.cu 1124 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/kernels/rmsnormKernels.h 34 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/lora/LoraManager.cc 129 9 289 8 9 1 2024-07-30 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/lora/LoraManager.h 47 10 289 8 10 1 2024-07-30 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/models_weight/W.h 143 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/position_ids_generator/PositionIdsGenerator.h 28 4 245 8 4 1 2024-09-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/position_ids_generator/PositionIdsGenerator.cc 102 2 232 8 2 1 2024-09-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/compute_occupancy.h 59 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/epilogue/collective/epilogue_moe_finalize.hpp 410 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/epilogue/thread/fused_activations.h 53 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/epilogue/threadblock/epilogue_per_row_per_col_scale.h 258 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/epilogue/threadblock/epilogue_tensor_op_int32.h 145 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/fused_moe_kernel_routine.cuh 717 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/default_int8_traits.h 33 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/mixed_gemm_B_layout.h 69 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/moe_cutlass_kernel.h 395 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/splitk_gemm_grouped.h 301 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/fpA_intB_gemm.h 375 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/gemm_moe_problem_visitor.h 34 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/gemm_with_epilogue_visitor.h 353 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/group_gemm_traits.h 31 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/fused_moe_kernel.cuh 196 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/fused_moe_kernel_traits.cuh 188 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/default_splitk_gemm_grouped.h 91 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/default_fpA_intB_traits.h 90 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/moe_cute_util.cuh 161 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/moe_sm90_traits.h 21 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/moe_problem_visitor.h 225 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/device/splitk_gemm_grouped.h 357 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/device/gemm_universal_base_compat.h 241 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/warp/mma_tensorop_compute_B_with_f16.h 156 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/warp/default_mma_tensor_op.h 41 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/warp/mma_tensorop_dequantizer.h 408 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/default_mma_bf16.h 189 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/dq_mma_base.h 112 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/dq_mma_pipelined.h 229 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/default_mma.h 152 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/default_dq_mma_pipelined.h 136 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/dq_mma_multistage_percol.h 364 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/dq_mma_multistage_finegrained.h 409 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/default_dq_mma.h 87 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/dq_mma_pipelined_finegrained.h 261 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/default_dq_mma_multistage.h 159 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/threadblock/dq_mma_multistage.h 41 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/transform/threadblock/fine_grained_scale_zero_iterator.h 143 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/arch/mma.h 92 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/arch/copy_red_global.hpp 205 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/interleaved_numeric_conversion.h 298 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/util/gather_tensor.hpp 118 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/tile_interleaved_layout.h 27 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/epilogue_helpers.h 92 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/interface.h 11 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/moe.bzl 261 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weight_only_quant_op.h 19 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/gemm_configs.h 118 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/cutlass_preprocessors.h 33 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/int8_gemm/int8_gemm_template.h 406 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/int8_gemm/int8_gemm.h 76 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/int8_gemm/int8_gemm_bf16.cu 28 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/int8_gemm/int8_gemm_fp32.cu 26 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/int8_gemm/int8_gemm_int32.cu 26 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/int8_gemm/int8_gemm_fp16.cu 26 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_gemm_kernels.h 167 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_gemm_hopper_input.cu 114 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_kernels.h 483 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_fp8_kernels.h 53 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_kernels.cu 1245 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_fp8_kernels.cu 418 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_gemm_kernels_template_sm90.h 152 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/launchers/moe_gemm_launcher_sm90.inl 247 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/launchers/fused_moe_gemm_launcher_sm80.inl 69 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/launchers/moe_gemm_launcher_sm90.h 16 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/launchers/fused_moe_gemm_launcher_sm80.h 9 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_kernels.inl 1005 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_gemm_kernels_template.h 878 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/kernel.h 111 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/utility.h 274 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/common.h 81 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/converter.h 60 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/int8SQ.cu 168 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/details.h 93 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/cudaCoreGemm.cu 249 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/cudaCoreGemm.h 51 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/fp8Gemm.h 44 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/kernelLauncher.h 75 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/kernelDispatcher.h 123 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/fp8Gemm.cu 148 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/int8SQ.h 44 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/group_gemm/group_gemm_fp32.cu 4 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/group_gemm/group_gemm_fp16.cu 4 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/group_gemm/group_gemm_template.h 230 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/group_gemm/group_gemm.h 23 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/group_gemm/group_gemm_bf16.cu 4 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/gemm_lut_utils.h 132 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/gemm_lut.cc 27 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/cutlass_preprocessors.cc 538 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/bf16_int8_gemm_fg_scaleonly.cu 28 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/bf16_int4_gemm_fg_scalebias.cu 29 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/bf16_int4_gemm_per_col.cu 29 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/fp16_int4_gemm_per_col.cu 26 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/fp16_int4_gemm_fg_scalebias.cu 27 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/fpA_intB_gemm_template.h 494 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/fpA_intB_gemm.h 90 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/fp16_int8_gemm_fg_scalebias.cu 26 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/fp16_int4_gemm_fg_scaleonly.cu 26 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/bf16_int4_gemm_fg_scaleonly.cu 29 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/fpA_intB_gemm_dummy_stubs.cu 31 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/fp16_int8_gemm_fg_scaleonly.cu 26 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/bf16_int8_gemm_fg_scalebias.cu 29 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/bf16_int8_gemm_per_col.cu 28 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/fpA_intB_gemm/fp16_int8_gemm_per_col.cu 26 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/cutlass_heuristic.cc 553 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/gemm_lut.h 58 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/cutlass_type_conversion.h 86 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/cutlass_kernels/cutlass_heuristic.h 56 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/cutlass/gen.py 1104 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/EngineScheduleInfo.h 17 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/EngineInitParameter.cc 332 43 348 8 48 3 2024-06-01 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/EngineInitParameter.h 132 18 348 7 21 1 2024-06-01 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/Query.h 149 38 422 8 42 1 2024-03-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/GenerateConfig.h 175 31 394 8 33 1 2024-04-16 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/EngineScheduleInfo.cc 15 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/LoadBalance.h 107 9 253 18 9 1 2024-09-04 2025-04-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/LoadBalance.cc 95 6 253 8 6 1 2024-09-04 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/Query.cc 18 7 422 8 7 1 2024-03-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/dataclass/MergedQuery.h 79 17 422 8 17 1 2024-03-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/HeartbeatSynchronizer.cpp 114 5 150 8 5 1 2024-12-16 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/HeartbeatSynchronizer.h 74 4 150 21 4 1 2024-12-16 2025-04-24 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/WorkerAwaredLoadBalancer.cpp 56 3 90 8 3 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/RRLoadBalancer.cpp 32 8 213 8 9 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/RRLoadBalancer.h 12 6 213 18 6 1 2024-10-14 2025-04-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/BaseLoadBalancer.cpp 53 5 164 8 5 1 2024-12-02 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/WRRLoadBalancer.h 21 8 164 18 8 1 2024-12-02 2025-04-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/SubscribeServiceManager.cpp 60 6 213 8 6 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/LocalSubscribeService.h 18 2 213 190 2 1 2024-10-14 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/SubscribeServiceConfig.h 60 4 213 164 4 1 2024-10-14 2024-12-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/SubscribeServiceCreator.cpp 25 3 190 182 3 1 2024-11-06 2024-11-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/SubscribeServiceManager.h 17 2 213 190 2 1 2024-10-14 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/LocalSubscribeService.cpp 27 5 213 8 5 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/SubscribeService.h 10 2 213 190 2 1 2024-10-14 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/TopoNode.h 15 2 213 164 2 1 2024-10-14 2024-12-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/TopoNode.cpp 9 2 213 164 2 1 2024-10-14 2024-12-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/NacosSubscribeService.cpp 43 2 183 8 2 1 2024-11-13 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/SubscribeServiceConfig.cpp 80 4 213 164 4 1 2024-10-14 2024-12-02 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/SubscribeServiceCreator.h 7 3 190 182 3 1 2024-11-06 2024-11-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/subscribe/NacosSubscribeService.h 18 1 183 183 1 1 2024-11-13 2024-11-13 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/WRRLoadBalancer.cpp 116 9 164 8 12 1 2024-12-02 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/WorkerAwaredLoadBalancer.h 25 2 90 38 2 1 2025-02-14 2025-04-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/load_balancer/BaseLoadBalancer.h 34 5 164 18 5 1 2024-12-02 2025-04-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/metrics/CacheStoreMetricsCollector.cpp 211 2 213 190 2 1 2024-10-14 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/metrics/CacheStoreMetricsCollector.h 119 2 213 190 2 1 2024-10-14 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/metrics/CacheStoreMetricsReporter.h 48 2 213 190 2 1 2024-10-14 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/metrics/CacheStoreMetricsReporter.cpp 141 4 213 8 4 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/MessagerServer.h 31 2 213 190 2 1 2024-10-14 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/CacheLoadServiceClosure.h 46 4 213 8 4 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/NoRdmaMemoryUtilImpl.cpp 21 6 213 8 6 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/LoadContext.h 65 3 167 72 3 1 2024-11-29 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/NormalCacheStore.cpp 199 8 213 8 8 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/Timer.cpp 25 1 190 190 1 1 2024-11-06 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/RequestBlockBufferStore.cpp 161 12 213 8 13 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/InitParams.h 18 5 213 8 5 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/TimerManager.cpp 34 1 190 190 1 1 2024-11-06 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/Interface.h 18 4 213 161 4 1 2024-10-14 2024-12-05 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/CommonDefine.h 53 3 213 185 3 1 2024-10-14 2024-11-11 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/LoadContext.cpp 147 4 167 8 4 1 2024-11-29 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/CacheStoreServiceImpl.h 46 2 213 190 3 1 2024-10-14 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/Impl.cpp 28 4 213 161 4 1 2024-10-14 2024-12-05 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/CacheLoadServiceClosure.cpp 90 5 213 8 5 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/NormalCacheStore.h 68 7 213 72 7 1 2024-10-14 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/CacheStoreServiceImplContext.h 49 3 190 73 4 1 2024-11-06 2025-03-03 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/RequestBlockBuffer.cpp 110 6 213 8 8 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/RequestBlockBuffer.h 54 7 213 8 9 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/RequestBlockBufferStore.h 34 5 213 8 6 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/Timer.h 21 1 190 190 1 1 2024-11-06 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/MessagerServer.cpp 73 5 213 8 5 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/TimerManager.h 20 1 190 190 1 1 2024-11-06 2024-11-06 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/MessagerClient.cpp 126 8 213 8 8 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/MemoryUtil.h 15 5 213 75 5 1 2024-10-14 2025-03-01 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/proto/cache_store_service.proto 51 4 213 73 4 1 2024-10-14 2025-03-03 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/CacheStoreServiceImpl.cpp 82 6 213 8 7 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/CacheStore.h 36 5 167 72 5 1 2024-11-29 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/CacheStoreServiceImplContext.cpp 161 7 190 8 8 1 2024-11-06 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/NoRdmaMemoryUtilImpl.h 12 5 213 75 5 1 2024-10-14 2025-03-01 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/cache_store/MessagerClient.h 44 4 213 72 4 1 2024-10-14 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/common/UserRequest.h 13 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/common/TaskDescription.h 19 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/cluster/PrefillWorkerInfo.h 120 2 90 8 2 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/cluster/PrefillLoadBalancer.h 36 3 90 18 3 1 2025-02-14 2025-04-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/cluster/PrefillLoadBalancer.cpp 160 5 90 8 5 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/estimator/PrefillTimeEstimator.cpp 24 2 90 8 2 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/estimator/PrefillTimeEstimator.h 22 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/estimator/LookupMapImpl.h 81 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/estimator/EstimatorConfig.h 24 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/estimator/LookupMapImpl.cpp 187 2 90 8 2 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/estimator/LookupPrefillEstimator.h 19 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/estimator/LookupPrefillEstimator.cpp 25 2 90 8 2 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/entry/RtpLLMMasterEntry.cpp 92 3 90 8 3 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/entry/MasterInitParameter.h 40 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/entry/RandomRequestIdGenerator.h 27 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/entry/Response.h 64 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/entry/MasterInitParameter.cpp 34 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/entry/Init.cpp 10 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/entry/MasterHttpServer.cpp 102 2 90 8 2 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/entry/MasterHttpServer.h 49 2 90 8 2 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/entry/RtpLLMMasterEntry.h 28 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/tokenize/RemoteTokenizeModule.cpp 69 2 90 8 2 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/disaggregate/rtpllm_master/tokenize/RemoteTokenizeModule.h 17 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/multi_gpu_gpt/EmbeddingHandlerOp.h 32 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/multi_gpu_gpt/RtpLLMOp.h 52 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/multi_gpu_gpt/RtpEmbeddingOp.cc 122 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/multi_gpu_gpt/RtpEmbeddingOp.h 49 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/multi_gpu_gpt/RtpLLMOp.cc 218 2 8 7 2 1 2025-05-07 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/multi_gpu_gpt/EmbeddingHandlerOp.cc 21 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/GptInitParameter.cc 378 2 8 7 2 1 2025-05-07 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/common/InitEngineOps.h 7 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/common/NcclOp.h 20 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/common/InitEngineOps.cc 21 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/common/NcclOp.cc 44 1 8 8 2 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/common/CutlassConfigOps.cc 51 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/GptInitParameterRegister.h 7 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/GptInitParameter.h 220 2 8 7 2 1 2025-05-07 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/th_utils.h 56 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/th_op/init.cc 20 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/tokenizer/Tokenizer.cc 45 3 114 96 3 1 2025-01-21 2025-02-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/tokenizer/Tokenizer.h 20 3 114 96 3 1 2025-01-21 2025-02-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/schedulers/BatchDecodeScheduler.h 133 3 35 8 3 1 2025-04-10 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/schedulers/FIFOScheduler.h 59 23 394 8 25 1 2024-04-16 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/schedulers/FIFOScheduler.cc 259 40 394 8 47 1 2024-04-16 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/schedulers/SchedulerBase.h 23 8 394 21 8 1 2024-04-16 2025-04-24 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/stream/GenerateStream.h 289 39 245 8 45 1 2024-09-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/stream/GenerateStream.cc 688 43 245 8 49 1 2024-09-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/stream/StreamGroups.h 172 6 239 8 6 1 2024-09-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/stream/CompleteTokenIds.h 42 10 133 8 10 1 2025-01-02 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/stream/CompleteTokenIds.cc 172 12 133 8 12 1 2025-01-02 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/stream/StreamCacheResource.cc 235 16 239 8 16 1 2024-09-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/stream/StreamCacheResource.h 83 9 239 31 9 1 2024-09-18 2025-04-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/LocalRpcServer.cc 137 16 199 8 17 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/LocalRpcServiceImpl.h 61 6 199 8 6 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/DecodeGenerateContext.h 63 6 199 72 7 1 2024-10-28 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/PrefillGenerateContext.cc 156 14 199 8 14 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/PrefillRpcServer.h 42 8 199 8 8 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/LocalRpcServer.h 65 12 218 8 12 1 2024-10-09 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/RemoteServerResource.h 16 4 199 72 4 1 2024-10-28 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/QueryConverter.cc 226 40 394 8 43 1 2024-04-16 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/GenerateContext.h 97 5 199 42 5 1 2024-10-28 2025-04-03 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/PrefillRpcServerRuntimeMeta.h 57 2 90 8 2 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/RemoteRpcServiceImpl.h 69 4 199 8 4 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/GenerateContext.cc 47 2 199 90 2 1 2024-10-28 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/QueryConverter.h 24 8 394 8 8 1 2024-04-16 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/DecodeRpcServer.cc 638 21 218 8 26 1 2024-10-09 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/RemoteRpcServiceImpl.cc 19 1 189 189 1 1 2024-11-07 2024-11-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/model_rpc_client.py 188 57 394 18 65 1 2024-04-16 2025-04-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/PrefillRpcServer.cc 408 24 199 8 29 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/DecodeRpcServer.h 57 11 199 8 11 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/RemoteRpcServer.h 26 5 199 8 5 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/PrefillGenerateContext.h 91 11 199 72 12 1 2024-10-28 2025-03-04 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/DecodeGenerateContext.cc 74 4 199 8 4 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/RPCPool.h 68 7 199 8 7 1 2024-10-28 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/model_rpc/RemoteRpcServer.cc 83 11 218 8 12 1 2024-10-09 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/utils.h 8 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/include/fp8_gemm.cuh 387 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/include/utils.cuh 39 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/include/scheduler.cuh 87 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/include/tma_utils.cuh 84 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/include/mma_utils.cuh 809 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/DeepGemmPlugin.cpp 449 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/deep_gemm_template.h 92 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/def.bzl 26 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/deep_gemm/DeepGemmPlugin.h 15 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/multimodal_processor/RemoteMultimodalProcessor.h 97 3 154 8 3 1 2024-12-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/multimodal_processor/MultimodalProcessor.h 39 28 309 8 30 1 2024-07-10 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/multimodal_processor/MultimodalProcessor.cc 164 2 154 8 2 1 2024-12-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/multimodal_processor/LocalMultimodalProcessor.h 60 3 154 8 3 1 2024-12-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/TrackerAllocator.h 30 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/allocator.cc 6 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/torch_utils/torch_cuda_allocator.h 78 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/torch_utils/BufferTorchUtils.h 205 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/torch_utils/torch_cuda_allocator.cc 146 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/TrackerAllocator.cc 132 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/Event.h 18 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/BufferHelper.h 51 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/Types.cc 129 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/Types.h 78 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/cpu_allocator.cc 17 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/Buffer.cc 159 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/MemoryTracker.cc 127 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/MemoryTracker.h 42 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/allocator.h 40 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/QBuffer.h 72 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/Buffer.h 154 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/QBuffer.cc 129 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/core/cpu_allocator.h 18 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/openai/ChatRender.cc 171 3 114 8 3 1 2025-01-21 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/openai/ApiDataType.h 119 3 114 69 3 1 2025-01-21 2025-03-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/openai/ApiDataType.cc 139 3 114 69 3 1 2025-01-21 2025-03-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/openai/ChatRender.h 66 2 114 113 2 1 2025-01-21 2025-01-22 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/openai/OpenaiEndpoint.h 30 3 114 8 3 1 2025-01-21 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/openai/OpenaiEndpoint.cc 120 5 114 8 5 1 2025-01-21 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/eplb/ExpertBalancer.h 109 3 25 8 3 1 2025-04-20 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/eplb/ExpertBalancerPythonWrapper.cc 37 1 25 25 1 1 2025-04-20 2025-04-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/eplb/ExpertBalancer.cc 273 3 25 8 3 1 2025-04-20 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/eplb/ExpertBalancerPythonWrapper.h 45 2 25 24 2 1 2025-04-20 2025-04-21 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/common/trtPluginsInterface.h 2 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/common/checkMacrosPlugin.cpp 13 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/common/checkMacrosPlugin.h 7 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/smoothQuantGemmPlugin/smoothQuantGemmPlugin.h 36 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/smoothQuantGemmPlugin/smoothQuantGemmPlugin.cpp 77 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/mixtureOfExperts/mixtureOfExpertsPlugin.cpp 130 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/mixtureOfExperts/mixtureOfExpertsPlugin.h 71 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/GroupGemmPlugin/GroupGemmPlugin.cpp 21 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/GroupGemmPlugin/GroupGemmPlugin.h 23 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/weightOnlyGroupwiseQuantMatmulPlugin/weightOnlyGroupwiseQuantMatmulPlugin.h 44 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/weightOnlyGroupwiseQuantMatmulPlugin/weightOnlyGroupwiseQuantMatmulPlugin.cpp 121 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/weightOnlyQuantMatmulPlugin/weightOnlyQuantMatmulPlugin.cpp 99 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/trt_plugins/weightOnlyQuantMatmulPlugin/weightOnlyQuantMatmulPlugin.h 59 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/DeviceFactory.cc 197 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/DeviceBase.cc 406 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/device_defs.bzl 50 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmSoftmaxOp.cc 331 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmGemmOp.cc 106 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmAttentionOp.cc 610 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmGemmOptOp.cc 145 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmDevice.cc 132 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmLayerNormOp.cc 1337 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmActOp.cc 126 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/gemm_opt/arm_common.h 265 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/gemm_opt/activation_const.hpp 33 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/gemm_opt/ArmGemmKernel.h 200 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/gemm_opt/gemm_microkernel_macro_m8_bf16.h 1173 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/gemm_opt/ArmGemmThreadblock.cc 875 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/gemm_opt/activation_macro.h 235 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/gemm_opt/ArmGemmPacking.cc 767 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmSampleOp.cc 319 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmEmbeddingLookup.cc 89 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmDevice.h 67 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmGemmKaiOp.cc 385 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/type_bf16/bfloat16_cmath_impl.hpp 92 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/type_bf16/bfloat16_impl.hpp 229 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/type_bf16/hie_bfloat16.hpp 330 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/type_bf16/hie_bfloat16_cmath.hpp 78 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/arm_impl/ArmWeights.cc 44 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/Weights.h 114 2 8 7 3 1 2025-05-07 2025-05-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/utils/DevicePerfWrapper.h 30 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/utils/DebugUtils.h 34 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/utils/DebugUtils.cc 338 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/utils/Timer.h 95 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/testing/TestBase.cc 5 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/testing/TestBase.h 354 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/DeviceData.h 92 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaBeamSearchOp.cc 71 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaLoraLinear.cc 243 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaDeviceRegister.cc 5 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/DeepEPBuffer.cc 603 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaGemmOp.cc 340 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaDeepEPLLFfnLayer.cc 104 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaMlaAttentionOp.cc 261 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaEmbeddingLookup.cc 36 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaLayernorm.cc 287 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaAddBiasOp.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaMlaContextAttention.cc 7 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaDevice.cc 619 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaFfnLayer.cc 393 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaSampleOp.cc 418 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaMlaQKVGemm.cc 10 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaGroupGemmOp.cc 62 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaDeepEPFfnLayer.cc 261 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaFlashInfer.h 77 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/DeepEPBuffer.h 130 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaLoraLinearWithActOp.cc 28 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/DeepEPDefs.h 252 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaWeights.cc 59 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaOps.cc 571 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaSoftmaxOp.cc 89 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaAttentionOp.cc 312 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaFP8Moe.cc 313 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaNvtxOp.cc 10 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaActOp.cc 102 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaQuantizeOp.cc 175 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaPrefillAttention.cc 269 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaFlashInfer.cc 469 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cuda_impl/CudaDevice.h 246 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_impl/MhaQKVGemm.cc 49 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_impl/AttentionLayer.cc 194 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_impl/MlaAttentionLayer.cc 150 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_impl/FfnLayer.cc 308 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_impl/LoraLinear.cc 186 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_impl/GroupGemm.cc 27 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_impl/LoraLinearWithActivation.cc 11 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/BufferManager.h 69 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/DeviceOps.h 78 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/RocmTestUtils.h 7 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/torch_hip_allocator.h 99 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/custom_ar_comm.cc 229 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmWeights.cc 117 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/custom_ar_comm.h 47 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmSampleOp.cc 266 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmGemmOp.cc 288 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmActOp.cc 86 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmOps.cc 54 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmAttentionOp.cc 385 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/torch_hip_allocator.cc 50 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmLoraLinearWithActOP.cc 132 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmSoftmaxOp.cc 70 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmDevice.cc 372 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmLayernorm.cc 265 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmAllocator.h 40 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmQuantizeOp.cc 91 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmFfnLayer.cc 166 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmDistributedOp.cc 93 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/rocm_impl/ROCmDevice.h 101 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/BufferManager.cc 172 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/DeviceBase.h 97 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/OpData.h 838 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/DeviceExport.h 45 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cpu_impl/CpuSampleOp.cc 432 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cpu_impl/CpuDevice.h 32 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/cpu_impl/CpuDevice.cc 273 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/CommonDefines.h 11 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/DeviceExport.cc 11 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/LoraWeights.h 188 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/DeviceFactory.h 46 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/DeviceOps.cc 204 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/OpData.cc 116 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/LayerNormTest.hpp 217 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/AttentionOpTest.hpp 243 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/GemmOpTest.hpp 236 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/FfnLayerTest.hpp 506 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/BeamSearchOpTest.hpp 88 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/GroupGemmOpTest.hpp 86 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/ActOpTest.hpp 91 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/DistributedTest.cc 86 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/GeneralOpsTest.hpp 266 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/AttentionLayerTest.hpp 118 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/SoftmaxOpTest.hpp 69 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/BasicDeviceTest.cc 20 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/base_tests/LoraLinearLayerTest.hpp 155 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/torch_impl/GptModel.hpp 157 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/torch_impl/BeamSearchOp.h 80 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/devices/torch_impl/FfnLayer.h 204 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/system_prompt/SystemPromptConstructor.cc 40 17 381 8 17 1 2024-04-29 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/system_prompt/SystemPromptConstructor.h 19 7 381 8 7 1 2024-04-29 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/system_prompt/SystemPrompt.h 34 5 381 163 5 1 2024-04-29 2024-12-03 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_client/SimpleHttpClient.cpp 89 5 182 8 5 1 2024-11-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_client/HandleHttpPacket.cpp 50 5 182 8 5 1 2024-11-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_client/HandleHttpPacket.h 26 2 182 148 2 1 2024-11-14 2024-12-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_client/ConnectionPool.cpp 110 3 182 8 3 1 2024-11-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_client/SimpleHttpClient.h 44 4 182 85 4 1 2024-11-14 2025-02-19 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_client/ConnectionPool.h 30 2 182 148 2 1 2024-11-14 2024-12-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpError.h 16 1 261 261 1 1 2024-08-27 2024-08-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpServer.h 37 4 266 247 4 3 2024-08-22 2024-09-10 tianyu.li@arm.com itej89@gmail.com maga_transformer/cpp/http_server/http_server/HttpRequest.cpp 34 6 261 120 6 1 2024-08-27 2025-01-15 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpResponseWriter.h 44 7 261 148 7 1 2024-08-27 2024-12-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/ANetApp.h 26 1 261 261 1 1 2024-08-27 2024-08-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpRouter.h 26 5 266 156 5 3 2024-08-22 2024-12-10 tianyu.li@arm.com rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/ANetApp.cpp 39 1 261 261 1 1 2024-08-27 2024-08-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpRequest.h 31 6 261 120 6 1 2024-08-27 2025-01-15 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpServerAdapter.h 28 3 261 237 3 1 2024-08-27 2024-09-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpResponseWriter.cpp 127 7 261 148 7 1 2024-08-27 2024-12-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpResponse.cpp 23 3 261 246 3 1 2024-08-27 2024-09-11 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpResponse.h 32 4 261 244 4 1 2024-08-27 2024-09-13 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpRequestWorkItem.cpp 17 2 261 248 2 1 2024-08-27 2024-09-09 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpRequestWorkItem.h 24 2 261 248 2 1 2024-08-27 2024-09-09 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpServerAdapter.cpp 116 3 261 237 3 1 2024-08-27 2024-09-20 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpServer.cpp 43 2 261 248 2 1 2024-08-27 2024-09-09 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/http_server/http_server/HttpRouter.cpp 45 3 261 247 3 2 2024-08-27 2024-09-10 rtp-llm@alibaba itej89@gmail.com maga_transformer/cpp/engine_base/EngineBase.cc 35 25 363 8 29 1 2024-05-17 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/engine_base/Executor.h 84 34 388 8 34 1 2024-04-22 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/engine_base/EngineBase.h 61 21 386 8 22 1 2024-04-24 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/proto/create_grpc_proto.py 11 1 119 119 1 1 2025-01-16 2025-01-16 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/proto/model_rpc_service.proto 197 39 394 18 40 1 2024-04-16 2025-04-27 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/proto/embedding/all_embedding_rpc_service.proto 15 1 288 288 1 1 2024-07-31 2024-07-31 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/stats/ExpertStats.h 41 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/AccessLogWrapper.cc 248 6 148 8 7 1 2024-12-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/InferenceService.h 78 3 148 8 3 1 2024-12-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ApiServerMetrics.h 59 1 148 148 1 1 2024-12-18 2024-12-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/GenerateStreamWrapper.cc 127 2 148 8 2 1 2024-12-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/InferenceDataType.h 142 4 148 8 4 1 2024-12-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/EmbeddingService.cc 117 6 147 8 7 1 2024-12-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ChatService.cc 186 3 114 8 3 1 2025-01-21 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/WeightsLoader.cc 21 2 85 8 3 1 2025-02-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/InferenceService.cc 321 4 148 8 4 1 2024-12-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/SysCmdService.cc 37 2 185 8 2 1 2024-11-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/common/HealthService.cc 51 2 90 8 2 1 2025-02-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/common/HealthService.h 21 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ChatService.h 64 3 114 8 3 1 2025-01-21 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/GenerateStreamWrapper.h 37 2 148 8 2 1 2024-12-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/GangServer.cc 109 2 85 8 2 1 2025-02-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ParallelInfo.h 90 3 174 83 3 1 2024-11-22 2025-02-21 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/LogLevelOps.h 5 1 185 185 1 1 2024-11-11 2024-11-11 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/LoraService.cc 227 2 85 8 2 1 2025-02-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ModelStatusService.cc 27 1 185 185 1 1 2024-11-11 2024-11-11 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/GangServer.h 25 1 85 85 1 1 2025-02-19 2025-02-19 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/TokenizerService.cc 85 3 174 8 3 1 2024-11-22 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/Exception.h 147 6 148 8 6 1 2024-12-18 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/WeightsLoader.h 14 2 85 8 2 1 2025-02-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/AccessLogWrapper.h 26 3 148 121 3 1 2024-12-18 2025-01-14 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/EmbeddingEndpoint.cc 91 6 154 8 7 1 2024-12-12 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ApiServerMetrics.cc 146 1 148 148 1 1 2024-12-18 2024-12-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ConcurrencyControllerUtil.h 59 1 148 148 1 1 2024-12-18 2024-12-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ErrorResponse.cc 13 1 174 174 1 1 2024-11-22 2024-11-22 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/HttpApiServer.cc 354 14 213 8 16 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/EmbeddingService.h 33 2 147 125 2 1 2024-12-19 2025-01-10 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/SysCmdService.h 13 1 185 185 1 1 2024-11-11 2024-11-11 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/TokenizerService.h 27 2 174 149 2 1 2024-11-22 2024-12-17 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ErrorResponse.h 14 1 174 174 1 1 2024-11-22 2024-11-22 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/ModelStatusService.h 14 1 185 185 1 1 2024-11-11 2024-11-11 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/LoraService.h 52 2 85 8 2 1 2025-02-19 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/TokenProcessor.cc 117 5 174 8 5 1 2024-11-22 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/TokenProcessor.h 40 4 174 113 4 1 2024-11-22 2025-01-22 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/EmbeddingEndpoint.h 34 4 213 120 4 1 2024-10-14 2025-01-15 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/LogLevelOps.cc 23 3 185 8 3 1 2024-11-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/WorkerStatusService.cc 47 2 188 8 2 1 2024-11-08 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/WorkerStatusService.h 45 3 188 21 3 1 2024-11-08 2025-04-24 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/TokenizerEncodeResponse.h 28 1 174 174 1 1 2024-11-22 2024-11-22 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/api_server/HttpApiServer.h 127 12 213 8 13 1 2024-10-14 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/quantizePreprocessors.h 30 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/12_int4_dequant_gemm_128x64x16x128_16_16x16_2x1_16x8x1_8x16x1_16_1x16x1x8_2_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/7_int4_dequant_gemm_64x16x16x128_16_16x16_1x1_8x8x1_8x8x1_16_1x16x1x4_4_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/1_int4_dequant_gemm_256x128x128x64_32_32x32_2x2_8x32x1_2x128x1_32_1x32x1x8_8_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/23_int4_dequant_gemm_128x64x32x128_32_32x32_1x1_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/30_int4_dequant_gemm_128x32x64x128_32_32x32_1x1_16x8x1_4x32x1_32_1x16x1x8_8_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/0_int4_dequant_gemm_256x128x128x128_32_32x32_2x2_16x16x1_4x64x1_32_1x32x1x8_8_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/31_int4_dequant_gemm_128x16x128x128_32_16x16_1x4_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/19_int4_dequant_gemm_128x16x128x128_32_16x16_1x4_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/3_int4_dequant_gemm_256x128x128x64_32_32x32_2x2_8x32x1_2x128x1_16_1x32x1x8_8_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/33_int4_dequant_gemm_256x16x256x128_32_16x16_1x4_16x8x1_4x32x1_32_1x16x1x16_4_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/25_int4_dequant_gemm_128x32x16x128_16_16x16_1x1_16x8x1_8x16x1_16_1x16x1x8_2_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/16_int4_dequant_gemm_128x16x32x128_32_16x16_1x1_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/int4_dequant_kernel_manifest.h 40 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/36_int4_dequant_gemm_256x128x128x64_32_32x32_4x1_8x32x1_2x128x1_32_1x32x1x8_8_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/29_int4_dequant_gemm_128x16x64x128_32_16x16_1x2_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/10_int4_dequant_gemm_128x128x16x128_16_16x16_4x1_16x8x1_8x16x1_16_1x16x1x8_2_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/5_int4_dequant_gemm_128x32x16x128_16_16x16_1x1_8x16x1_8x16x1_16_1x16x1x8_2_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/11_int4_dequant_gemm_128x64x32x128_32_32x32_1x1_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/37_int4_dequant_gemm_256x16x64x256_32_16x16_1x1_32x8x1_8x32x1_32_1x16x1x8_8_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/int4_dequant_comm.h 174 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/20_int4_dequant_gemm_128x32x128x128_32_32x32_1x2_16x8x1_4x32x1_32_1x16x1x8_8_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/13_int4_dequant_gemm_128x32x16x128_16_16x16_1x1_16x8x1_8x16x1_16_1x16x1x8_2_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/32_int4_dequant_gemm_128x32x128x128_32_32x32_1x2_16x8x1_4x32x1_32_1x16x1x8_8_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/28_int4_dequant_gemm_128x16x32x128_32_16x16_1x1_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/8_int4_dequant_gemm_128x16x32x128_32_16x16_1x1_8x16x1_4x32x1_32_1x16x1x8_4_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/18_int4_dequant_gemm_128x32x64x128_32_32x32_1x1_16x8x1_4x32x1_32_1x16x1x8_8_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/4_int4_dequant_gemm_256x128x128x64_32_32x32_2x2_8x32x1_2x128x1_16_1x32x1x8_8_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/21_int4_dequant_gemm_256x16x256x128_32_16x16_1x4_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/34_int4_dequant_gemm_256x32x256x128_32_32x32_1x2_16x16x1_4x64x1_32_1x16x1x16_8_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/26_int4_dequant_gemm_64x16x16x128_16_16x16_1x1_16x4x1_8x8x1_16_1x16x1x4_4_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/24_int4_dequant_gemm_128x64x16x128_16_16x16_2x1_16x8x1_8x16x1_16_1x16x1x8_2_intrawave_v4.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/9_int4_dequant_gemm_128x128x32x128_32_32x32_2x1_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/22_int4_dequant_gemm_256x32x256x128_32_32x32_1x2_16x16x1_4x64x1_32_1x16x1x16_8_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/17_int4_dequant_gemm_128x16x64x128_32_16x16_1x2_16x8x1_4x32x1_32_1x16x1x8_4_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/6_int4_dequant_gemm_64x16x16x128_16_16x16_1x1_16x4x1_8x8x1_16_1x16x1x4_4_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/int4_gemm_kernels/35_int4_dequant_gemm_256x128x128x64_32_32x32_2x2_8x32x1_2x128x1_32_1x32x1x8_8_intrawave_v3.cc 24 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/hipblasMMWrapper.h 104 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/rocmCKGemmWrapper.cc 134 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/rocmMoeWrapper.h 40 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/hipblasAlgoMap.cc 252 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/hip_utils.cc 87 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/rocmCKGemmWrapper.h 25 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/hipblasAlgoMap.h 92 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/hip_utils.h 233 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/rocmFmhaWrapper.cc 228 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/rocmFmhaWrapper.h 45 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/quantizePreprocessors.cc 491 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/amd_bfloat16.h 121 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/hipblasMMWrapper.cc 366 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/cuda_shims.h 94 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/rocm/rocmMoeWrapper.cc 106 1 8 8 1 1 2025-05-07 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/SpeculativeEngine.cc 576 34 388 8 44 1 2024-04-22 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/SpeculativeScheduler.h 17 2 211 8 2 1 2024-10-16 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/speculative_sampler/SpeculativeSamplerOutput.h 21 2 263 8 2 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/speculative_sampler/RejectionSampler.h 19 5 263 8 5 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/speculative_sampler/SpeculativeSampler.cc 16 5 263 8 5 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/speculative_sampler/RejectionSampler.cc 151 18 263 8 21 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/speculative_sampler/SpeculativeSampler.h 21 3 263 8 3 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/SpeculativeStreamOutput.h 85 8 263 8 8 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/SpeculativeEngine.h 87 18 388 27 23 1 2024-04-22 2025-04-18 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/SpeculativeScheduler.cc 24 2 211 188 2 1 2024-10-16 2024-11-08 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/MTPStream.h 110 3 34 8 3 1 2025-04-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/MTPBatchStreamProcessor.cc 51 2 34 8 2 1 2025-04-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/VanillaStream.h 74 16 263 8 19 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/VanillaExecutor.cc 45 10 263 8 10 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/ProposeOutput.h 28 4 263 34 5 1 2024-08-25 2025-04-11 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/DeterministicExecutor.cc 139 12 211 8 14 1 2024-10-16 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/ProposeExecutor.h 31 7 263 8 8 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/MTPBatchStreamProcessor.h 11 2 34 8 2 1 2025-04-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/ProposeExecutor.cc 29 4 263 8 4 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/VanillaExecutor.h 46 6 263 8 7 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/MTPExecutor.h 64 2 34 8 2 1 2025-04-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/MTPExecutor.cc 39 3 34 8 3 1 2025-04-11 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/DeterministicExecutor.h 41 6 211 8 8 1 2024-10-16 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/propose_executor/ProposeDynamicConfig.h 7 1 263 263 1 1 2024-08-25 2024-08-25 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/speculative_updater/SpeculativeUpdaterConfig.h 11 1 263 263 1 1 2024-08-25 2024-08-25 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/speculative_updater/SpeculativeUpdaterConfig.cc 15 4 263 8 4 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/speculative_updater/SpeculativeUpdater.cc 46 16 263 8 16 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/speculative_updater/SpeculativeUpdater.h 47 5 263 8 5 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/SpeculativeOnlineAdaptor.h 13 3 263 8 3 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/score_executor/ScoreStream.h 74 20 263 8 20 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/score_executor/ScoreExecutor.h 44 7 263 8 8 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/score_executor/ScoreOutput.h 21 3 263 112 3 1 2024-08-25 2025-01-23 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/score_executor/ScoreBatchStreamProcessor.h 15 4 263 8 4 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/score_executor/ScoreExecutor.cc 63 8 263 8 8 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/speculative_engine/score_executor/ScoreBatchStreamProcessor.cc 143 11 263 8 12 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/normal_engine/NormalEngine.cc 277 58 393 8 76 1 2024-04-17 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/normal_engine/NormalGenerateStream.h 31 11 263 8 13 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/normal_engine/NormalEngine.h 58 28 393 8 34 1 2024-04-17 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/normal_engine/NormalExecutor.cc 179 45 388 8 54 1 2024-04-22 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/normal_engine/NormalExecutor.h 41 20 388 8 21 1 2024-04-22 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/normal_engine/NormalBatchStreamProcessor.h 55 24 384 8 26 1 2024-04-26 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/normal_engine/NormalBatchStreamProcessor.cc 415 65 384 8 81 1 2024-04-26 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/cpp/normal_engine/NormalGenerateStream.cc 150 25 263 8 27 1 2024-08-25 2025-05-07 rtp-llm@alibaba rtp-llm@alibaba maga_transformer/access_logger/log_utils.py 16 4 504 44 4 2 2023-12-28 2025-04-01 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/access_logger/json_util.py 13 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com maga_transformer/access_logger/access_logger.py 60 4 504 44 4 2 2023-12-28 2025-04-01 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/access_logger/py_access_log.py 52 2 504 91 2 2 2023-12-28 2025-02-13 xinfei.sxf@alibaba-inc.com rtp-llm@alibaba maga_transformer/_ft_pickler.py 225 1 504 504 1 1 2023-12-28 2023-12-28 xinfei.sxf@alibaba-inc.com xinfei.sxf@alibaba-inc.com rtpllm_master_py/stub/librtpllm_master.pyi 65 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba rtpllm_master_py/__init__.py 19 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba rtpllm_master_py/entry.py 65 1 90 90 1 1 2025-02-14 2025-02-14 rtp-llm@alibaba rtp-llm@alibaba