local_inference/4bit_bnb.ipynb performance_optimization/torch_compile_with_torchao.ipynb local_inference/8bit_bnb.ipynb performance_optimization/torch_compile_with_torchao.ipynb local_inference/fp8-405B.ipynb performance_optimization/torch_compile_with_torchao.ipynb