llama_rag/llama_rag_pipeline.ipynb local_inference/awq.ipynb