assets/large_language_models/rag/components/git_clone/spec.yaml (40 lines of code) (raw):
# Azure ML command component that clones a git repository into its
# output_data folder.
$schema: https://azuremlschemas.azureedge.net/latest/commandComponent.schema.json
type: command

# Component identity.
name: llm_rag_git_clone
display_name: LLM - Clone Git Repo
version: 0.0.77

description: |
  Clones a git repository to output_data path

# NOTE(review): the component reads from a remote repository whose contents
# can change between runs with identical inputs -- confirm that treating the
# step as deterministic is intended.
is_deterministic: true

tags:
  Preview: ''
# Component inputs. Only git_repository is required; every other input is
# declared optional.
inputs:
  # Repository to clone.
  git_repository:
    type: string
    description: "The URL of the git repository"

  # Branch to check out; git's default is used when omitted.
  branch_name:
    type: string
    optional: true
    description: "The branch name to pull from the git repository, default picked by git if not specified."

  # Prefix naming the <PREFIX>-USER / <PREFIX>-PASS secret pair in the
  # Workspace Key Vault.
  authentication_key_prefix:
    type: string
    optional: true
    description: >-
      <PREFIX>-USER and <PREFIX>-PASS are the expected names of two Secrets
      in the Workspace Key Vault which will be used for authentication when
      pulling the given git repo.

  # Connection to a git provider, identified by its connection id.
  git_connection_id:
    type: string
    optional: true
    description: "The connection id of the git provider to use."
# Single output: the folder that receives the files of the cloned repository.
outputs:
  output_data:
    type: uri_folder
    mode: upload
    description: 'Uri folder containing all files from the git repo'
# Environment the job runs in, and the source directory shipped with the
# component.
environment: azureml:llm-rag-embeddings@latest
code: '../src/'

# Command line for the git_clone task.
# - Every ${{...}} substitution is single-quoted so that values containing
#   shell metacharacters (e.g. '&' or '?' in a repository URL) or spaces reach
#   the task as one literal argument, matching how output_data is passed.
# - Arguments wrapped in $[[ ]] belong to inputs declared optional; per the
#   Azure ML component syntax they are left out when the input is not set.
# - Keep all lines of the folded scalar at the same indentation so they are
#   joined into a single command line; comments must stay outside the scalar.
command: >-
  python -m azureml.rag.tasks.git_clone
  --git-repository '${{inputs.git_repository}}'
  $[[--branch-name '${{inputs.branch_name}}']]
  $[[--authentication-key-prefix '${{inputs.authentication_key_prefix}}']]
  $[[--git-connection-id '${{inputs.git_connection_id}}']]
  --output-data '${{outputs.output_data}}'