Path Lines of Code README.md 146 README_cn.md 125 benchmark/README.md 25 example/perf_test/ShareGPT_V3_test_data_lens.json 4002 maga_transformer/cpp/README.md 19 maga_transformer/cpp/kernels/decoder_masked_multihead_attention/mmha_notes.md 88 maga_transformer/test/model_test/README.md 13 maga_transformer/tools/quant/README.md 4 open_source/package/README.md 1 patches/boost/boost.patch 17 patches/flash_attention/0001-fix-fix-arch-80-compile.patch 39 patches/flash_attention/0002-fix-remove-torch-aten-dep.patch 135 patches/flash_attention/0003-fix-fix-is-local-judge.patch 31 patches/grpc/0001-Rename-gettid-functions.patch 70 patches/havenask/0001-fix-PrometheusSink-need-header.patch 20 patches/havenask/anet.patch 13 patches/havenask/cm2.patch 9 patches/havenask/havenask.patch 46 patches/kai/0001-add-a8w4-fp16-support.patch 1594 patches/nacos_sdk_cpp/nacos-compile.patch 24 patches/rules_python/0001-add-extra-data.patch 35 patches/rules_python/0001-fix-triton-and-pypi-wheel.patch 133 patches/rules_python/0001-xx.patch 24 patches/rules_python/0002-remove-import-from-rules_cc.patch 118 pyrightconfig.json 31 rtpllm_master_py/data/QWEN2_1.5B/A10_TP1_PP1_EP1_W16A16.json 91 rtpllm_master_py/data/QWEN2_14B/A10_TP1_PP1_EP1_W16A16.json 91 rtpllm_master_py/data/QWEN2_14B/PPU810E_TP1_PP1_EP1_W16A16.json 91 rtpllm_master_py/data/QWEN2_72B/H20_TP1_PP1_EP1_W4A4.json 139 rtpllm_master_py/develop.md 24