components/llm_service/notebooks/Config.ipynb (208 lines of code) (raw):
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "18679327-be5c-455c-95c5-bafaaf2bbfc0",
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"import sys\n",
"import json\n",
"import inspect\n",
"\n",
"# Remember the directory the kernel started in exactly once, so re-running\n",
"# this cell after the chdir below still resolves the same locations.\n",
"# Assumes the kernel starts in the notebook's own directory.\n",
"if \"NOTEBOOK_DIR\" not in globals():\n",
"    NOTEBOOK_DIR = os.getcwd()\n",
"\n",
"COMMON_SRC_DIR = os.path.abspath(\n",
"    os.path.join(NOTEBOOK_DIR, \"..\", \"..\", \"common\", \"src\"))\n",
"SRC_DIR = os.path.abspath(os.path.join(NOTEBOOK_DIR, \"..\", \"src\"))\n",
"\n",
"# Absolute entries stay valid regardless of the current working directory;\n",
"# the membership test avoids stacking duplicate entries on re-runs.\n",
"for src_path in (COMMON_SRC_DIR, SRC_DIR):\n",
"    if src_path not in sys.path:\n",
"        sys.path.append(src_path)\n",
"\n",
"# Later cells open files relative to the service's src directory.\n",
"os.chdir(SRC_DIR)"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "dee693e9-6bb0-405f-8bbf-716b2b2bb3cb",
"metadata": {},
"outputs": [],
"source": [
"# A `!export ...` line would run in a throwaway subshell and never reach\n",
"# this kernel, so the variable is set on the kernel's own environment.\n",
"# NOTE(review): presumably the config package reads PROJECT_ID when it is\n",
"# imported, so this cell must run before the import cell below - confirm.\n",
"project = \"gcp-mira-develop\"\n",
"os.environ[\"PROJECT_ID\"] = project"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "3d91fd7d-6ab3-4355-90e7-bfa51be58d5c",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"INFO: [config/config.py:55 - <module>()] Namespace File not found, setting job namespace as default\n",
"INFO: [config/config.py:110 - <module>()] ENABLE_GOOGLE_LLM = True\n",
"INFO: [config/config.py:111 - <module>()] ENABLE_OPENAI_LLM = True\n",
"INFO: [config/config.py:112 - <module>()] ENABLE_COHERE_LLM = True\n",
"INFO: [config/config.py:113 - <module>()] ENABLE_GOOGLE_MODEL_GARDEN = True\n",
"INFO: [config/config.py:114 - <module>()] ENABLE_TRUSS_LLAMA2 = True\n",
"INFO: [config/config.py:130 - <module>()] LLM types loaded ['VertexAI-Text', 'VertexAI-Chat-Palm2V2', 'VertexAI-Chat-Palm2V2-Langchain', 'VertexAI-Chat-Palm2-32k', 'VertexAI-Chat-Palm2-32k-Langchain', 'OpenAI-GPT4', 'OpenAI-GPT3.5', 'Cohere']\n",
"INFO: [config/config.py:141 - <module>()] Embedding types loaded ['VertexAI-Embedding', 'OpenAI-Embedding']\n",
"INFO: [config/vector_store_config.py:40 - <module>()] Default vector store = [langchain_pgvector]\n",
"INFO: [config/vector_store_config.py:49 - <module>()] PG_HOST = [127.0.0.1]\n",
"INFO: [config/vector_store_config.py:50 - <module>()] PG_DBNAME = [pgvector]\n"
]
}
],
"source": [
"from config.model_config import ModelConfig"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "8d72a529-2a4e-44e7-8450-c44f45eaf4d6",
"metadata": {},
"outputs": [],
"source": [
"# The models file is addressed relative to the current working directory.\n",
"model_config_path = os.path.join(*[\"config\", \"models.json\"])\n",
"\n",
"model_config = ModelConfig(model_config_path)\n",
"# Bare call as the final statement so any return value is displayed.\n",
"model_config.read_model_config()"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "25a987f5-b796-492a-9b41-f37c117d3e87",
"metadata": {},
"outputs": [],
"source": [
"model_config.llm_models"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "9d59ce3b-e8de-46d2-8af1-3e64b3345fe4",
"metadata": {},
"outputs": [],
"source": [
"model_config.llm_model_providers"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "d3bd20ac-93bd-476d-a336-9eccd2ad4f03",
"metadata": {},
"outputs": [],
"source": [
"model_config.llm_embedding_models"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "c9c84257-d0e6-4b63-936a-0fa7b4907e5b",
"metadata": {},
"outputs": [],
"source": [
"from config import (\n",
"    VERTEX_AI_MODEL_GARDEN_LLAMA2_CHAT,\n",
"    KEY_MODEL_ENDPOINT,\n",
"    KEY_MODEL_PARAMS,\n",
"    KEY_IS_CHAT,\n",
"    KEY_ENABLED,\n",
"    KEY_PROVIDER,\n",
"    PROVIDER_MODEL_GARDEN,\n",
"    get_model_config,\n",
"    get_provider_value,\n",
")\n",
"\n",
"# Stand-in configuration for a single Model Garden Llama2 chat model that\n",
"# points at a fake endpoint, so lookups can be tried without a deployment.\n",
"TEST_MODEL_GARDEN_CONFIG = {\n",
"    VERTEX_AI_MODEL_GARDEN_LLAMA2_CHAT: {\n",
"        KEY_PROVIDER: PROVIDER_MODEL_GARDEN,\n",
"        KEY_MODEL_ENDPOINT: \"fake-endpoint\",\n",
"        KEY_IS_CHAT: True,\n",
"        KEY_MODEL_PARAMS: {\n",
"            \"temperature\": 0.2,\n",
"            \"max_tokens\": 900,\n",
"            \"top_p\": 1.0,\n",
"            \"top_k\": 10,\n",
"        },\n",
"        KEY_ENABLED: True,\n",
"    },\n",
"}\n",
"\n",
"# Overwrite the loaded configuration with the stand-in. The provider table\n",
"# and the model table deliberately reference the same dict object.\n",
"get_model_config().llm_model_providers = {\n",
"    PROVIDER_MODEL_GARDEN: TEST_MODEL_GARDEN_CONFIG,\n",
"}\n",
"get_model_config().llm_models = TEST_MODEL_GARDEN_CONFIG"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "449d522c-b9ac-4a7e-af99-0b3fecd0b155",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"'fake-endpoint'"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Select the Llama2 chat model and look up its configured endpoint.\n",
"llm_type = VERTEX_AI_MODEL_GARDEN_LLAMA2_CHAT\n",
"get_provider_value(\n",
"    PROVIDER_MODEL_GARDEN,\n",
"    KEY_MODEL_ENDPOINT,\n",
"    llm_type,\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "8bc48f60-bfd7-418b-a661-78ea15ca369b",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"{'temperature': 0.2, 'max_tokens': 900, 'top_p': 1.0, 'top_k': 10}"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Same lookup for the model's parameter dict; `llm_type` is set in the\n",
"# previous cell.\n",
"get_provider_value(PROVIDER_MODEL_GARDEN, KEY_MODEL_PARAMS, llm_type)"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "1534ac16-cab4-4f64-b945-3c479d8c484b",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.13"
}
},
"nbformat": 4,
"nbformat_minor": 5
}