path # lines of code pyproject.toml 63 csrc/custom_ops/torch_bindings.cpp 17 csrc/custom_ops/dispatch_utils.h 45 csrc/custom_ops/dtype_fp8.cuh 32 csrc/custom_ops/custom_ops.h 17 csrc/custom_ops/quant_utils.cuh 520 csrc/custom_ops/kernels.cu 135 csrc/custom_ops/attention_generic.cuh 54 csrc/suffix_decoding/pybind.cc 21 csrc/suffix_decoding/int32_map.h 292 csrc/suffix_decoding/suffix_tree.h 61 csrc/suffix_decoding/suffix_tree.cc 431 projects/ulysses/offline_inference_ulysses.py 26 projects/swiftkv/offline_inference_swiftkv.py 22 projects/dynasor/openai_client.py 81 projects/dynasor/naive_client.py 105 projects/spec_dec/offline_inference_spec_dec.py 36 MANIFEST.in 2 arctic_inference/embedding/proto/inference.proto 69 arctic_inference/embedding/replica_manager.py 361 arctic_inference/embedding/generate_proto.py 51 arctic_inference/embedding/client.py 181 arctic_inference/embedding/replica.py 300 arctic_inference/dynasor/vllm_server.py 79 arctic_inference/dynasor/evaluator.py 676 arctic_inference/dynasor/entropy.py 101 arctic_inference/dynasor/util.py 22 arctic_inference/dynasor/cot.py 135 arctic_inference/dynasor/__init__.py 1 arctic_inference/dynasor/openai_server.py 272 arctic_inference/suffix_decoding/simulator.py 510 arctic_inference/suffix_decoding/cache.py 139 arctic_inference/suffix_decoding/__init__.py 2 arctic_inference/common/swiftkv/configs.py 11 arctic_inference/common/swiftkv/__init__.py 2 arctic_inference/common/__init__.py 1 arctic_inference/patching.py 41 arctic_inference/envs.py 18 arctic_inference/py_custom_ops.py 44 arctic_inference/vllm/swiftkv/llama_swiftkv.py 703 arctic_inference/vllm/swiftkv/__init__.py 2 arctic_inference/vllm/args.py 95 arctic_inference/vllm/plugin.py 23 arctic_inference/vllm/model_runner.py 634 arctic_inference/vllm/config.py 85 arctic_inference/vllm/structured_output.py 14 arctic_inference/vllm/spec_dec/fp8.py 252 arctic_inference/vllm/spec_dec/logits_processor_opt.py 67 arctic_inference/vllm/spec_dec/arctic_speculator.py 719 arctic_inference/vllm/spec_dec/arctic_proposer.py 116 arctic_inference/vllm/spec_dec/__init__.py 1 arctic_inference/vllm/spec_dec/vocab_parallel_embedding.py 346 arctic_inference/vllm/stats.py 36 arctic_inference/vllm/patches.py 57 arctic_inference/vllm/ulysses.py 401 arctic_inference/vllm/__init__.py 1 arctic_inference/__init__.py 1 arctic_inference/utils.py 12 setup.py 107 benchmark/embedding/benchmark_http.py 246 benchmark/embedding/benchmark.py 254 scripts/check_license.py 40 scripts/install_deps.py 48