Path Lines of Code maga_transformer/cpp/api_server/HttpApiServer.cc 354 maga_transformer/cpp/api_server/InferenceService.cc 321 maga_transformer/cpp/api_server/TokenProcessor.h 40 maga_transformer/cpp/cuda/cublas/cublasFP8MMWrapper.cc 882 maga_transformer/cpp/cuda/cublas/cublasMMWrapper.cc 912 maga_transformer/cpp/cuda/cufmha/fmha_profiling_interface.h 183 maga_transformer/cpp/cuda/reduce_kernel_utils.cuh 338 maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/fused_moe_kernel.cuh 196 maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/fused_moe_kernel_routine.cuh 717 maga_transformer/cpp/cutlass/cutlass_extensions/include/cutlass_extensions/gemm/kernel/mixed_gemm_B_layout.h 69 maga_transformer/cpp/cutlass/cutlass_kernels/int8_gemm/int8_gemm_template.h 406 maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/launchers/moe_gemm_launcher_sm90.inl 247 maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_fp8_kernels.cu 418 maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_kernels.cu 1245 maga_transformer/cpp/cutlass/cutlass_kernels/moe_gemm/moe_kernels.inl 1005 maga_transformer/cpp/cutlass/cutlass_kernels/weightOnlyBatchedGemv/kernelDispatcher.h 123 maga_transformer/cpp/devices/Weights.h 114 maga_transformer/cpp/devices/arm_impl/ArmDevice.cc 132 maga_transformer/cpp/devices/arm_impl/ArmGemmKaiOp.cc 385 maga_transformer/cpp/devices/arm_impl/gemm_opt/ArmGemmKernel.h 200 maga_transformer/cpp/devices/arm_impl/gemm_opt/ArmGemmThreadblock.cc 875 maga_transformer/cpp/devices/cuda_impl/CudaAttentionOp.cc 312 maga_transformer/cpp/devices/cuda_impl/CudaDeepEPFfnLayer.cc 261 maga_transformer/cpp/devices/cuda_impl/CudaDeepEPLLFfnLayer.cc 104 maga_transformer/cpp/devices/cuda_impl/CudaFfnLayer.cc 393 maga_transformer/cpp/devices/cuda_impl/CudaGemmOp.cc 340 maga_transformer/cpp/devices/cuda_impl/CudaOps.cc 571 maga_transformer/cpp/devices/cuda_impl/DeepEPDefs.h 252 maga_transformer/cpp/devices/rocm_impl/ROCmFfnLayer.cc 166 maga_transformer/cpp/disaggregate/cache_store/MessagerClient.cpp 126 maga_transformer/cpp/disaggregate/rtpllm_master/cluster/PrefillLoadBalancer.cpp 160 maga_transformer/cpp/disaggregate/rtpllm_master/tokenize/RemoteTokenizeModule.cpp 69 maga_transformer/cpp/kernels/activation_fp8_kernels.cu 235 maga_transformer/cpp/kernels/decoder_masked_multihead_attention/decoder_masked_multihead_attention.h 149 maga_transformer/cpp/kernels/decoder_masked_multihead_attention/decoder_masked_multihead_attention_template.h 1663 maga_transformer/cpp/kernels/decoder_masked_multihead_attention_utils.h 2737 maga_transformer/cpp/kernels/gpt_kernels.cu 1633 maga_transformer/cpp/kernels/layernorm_fp8_kernels.cu 998 maga_transformer/cpp/kernels/moe_topKSoftmax_kernels.cu 798 maga_transformer/cpp/kernels/no_aux_tc_kernels.cu 646 maga_transformer/cpp/kernels/sampling_penalty_kernels.cu 607 maga_transformer/cpp/kernels/sampling_topk_kernels.cu 575 maga_transformer/cpp/kernels/triton/aot_triton_kernel.bzl 252 maga_transformer/cpp/kernels/unfused_attention_fp8_kernels.cu 1012 maga_transformer/cpp/kernels/unfused_attention_kernels.cu 2425 maga_transformer/cpp/models/GptModel.cc 1224 maga_transformer/cpp/normal_engine/NormalGenerateStream.cc 150 maga_transformer/cpp/position_ids_generator/PositionIdsGenerator.h 28 maga_transformer/cpp/rocm/quantizePreprocessors.cc 491 maga_transformer/cpp/rocm/rocmFmhaWrapper.cc 228 maga_transformer/cpp/rocm/rocmMoeWrapper.cc 106 maga_transformer/cpp/schedulers/FIFOScheduler.h 59 maga_transformer/cpp/stream/GenerateStream.cc 688 maga_transformer/cpp/trt_plugins/mixtureOfExperts/mixtureOfExpertsPlugin.cpp 130 maga_transformer/cpp/trt_plugins/smoothQuantGemmPlugin/smoothQuantGemmPlugin.cpp 77 maga_transformer/device/device_impl.py 305 maga_transformer/model_factory.py 213 maga_transformer/models/base_model.py 467 maga_transformer/models/downstream_modules/classifier/classifier.py 45 maga_transformer/models/minicpmv/modeling_navit_siglip.py 566 maga_transformer/models/minicpmv/resampler.py 565 maga_transformer/openai/api_datatype.py 183 maga_transformer/openai/renderers/qwen_agent/llm/base.py 332 maga_transformer/openai/renderers/qwen_agent/llm/qwen_dashscope.py 197 maga_transformer/server/frontend_worker.py 250