in cli/readme.py [0:0]
def _strip_suffix_and_filter(paths, suffix, excluded):
    """Drop excluded paths and remove ``suffix`` from the ones that remain.

    A path is dropped when any entry of ``excluded`` occurs as a substring of
    the path after its separators have been normalized to "/". The returned
    names keep the separators that ``glob`` produced; only the membership test
    uses the normalized form.
    """
    kept = []
    for path in paths:
        normalized = path.replace(os.sep, "/")
        if any(entry in normalized for entry in excluded):
            continue
        kept.append(path.replace(suffix, ""))
    return kept


def main(args):
    """Collect the example files, regenerate workflows and README.md.

    Globs are evaluated relative to the current working directory.

    Args:
        args: object exposing a ``check_readme`` attribute. When it is truthy,
            the README content read before and after regeneration is passed to
            ``check_readme`` and the process exits with status 2 if that
            check fails.

    Raises:
        SystemExit: with code 2 when ``args.check_readme`` is set and
            ``check_readme`` returns a falsy value.
    """
    # get list of notebooks
    notebooks = sorted(glob.glob("**/*.ipynb", recursive=True))

    # make all notebooks consistent
    modify_notebooks(notebooks)

    # get list of jobs; each pattern is globbed and sorted on its own and the
    # results are concatenated in this order
    # NOTE(review): some patterns overlap (every match of "cli-automl-*.yml"
    # also matches "*cli-automl*.yml"), so a job can be listed more than once.
    # Kept as-is because the effect of de-duplicating on the generated output
    # is not visible from here -- confirm before changing.
    job_patterns = [
        ("jobs/**/*job*.yml", True),
        ("jobs/basics/*.yml", False),
        ("jobs/*/basics/**/*job*.yml", True),
        ("jobs/pipelines/**/*pipeline*.yml", True),
        ("jobs/spark/*.yml", False),
        ("jobs/automl-standalone-jobs/**/cli-automl-*.yml", True),
        ("jobs/pipelines-with-components/**/*pipeline*.yml", True),
        ("jobs/automl-standalone-jobs/**/*cli-automl*.yml", True),
        ("responsible-ai/**/cli-*.yml", True),
        ("jobs/parallel/**/*pipeline*.yml", True),
    ]
    jobs = []
    for pattern, recursive in job_patterns:
        jobs += sorted(glob.glob(pattern, recursive=recursive))
    # Separators are normalized before matching EXCLUDED_JOBS, the same way
    # every other category below is filtered, so exclusions also apply when
    # glob returns backslash-separated paths.
    jobs = _strip_suffix_and_filter(jobs, ".yml", EXCLUDED_JOBS)

    jobs_using_registry_components = _strip_suffix_and_filter(
        sorted(
            glob.glob(
                "jobs/pipelines-with-components/basics/**/*pipeline*.yml",
                recursive=True,
            )
        ),
        ".yml",
        EXCLUDED_JOBS,
    )

    # get list of endpoints
    endpoints = _strip_suffix_and_filter(
        sorted(glob.glob("endpoints/**/*endpoint.yml", recursive=True)),
        ".yml",
        EXCLUDED_ENDPOINTS,
    )

    # get list of resources
    resources = _strip_suffix_and_filter(
        sorted(glob.glob("resources/**/*.yml", recursive=True)),
        ".yml",
        EXCLUDED_RESOURCES,
    )

    # get list of assets
    assets = _strip_suffix_and_filter(
        sorted(glob.glob("assets/**/*.yml", recursive=True)),
        ".yml",
        EXCLUDED_ASSETS,
    )

    # get list of scripts (top-level *.sh files only)
    scripts = _strip_suffix_and_filter(
        sorted(glob.glob("*.sh", recursive=False)),
        ".sh",
        EXCLUDED_SCRIPTS,
    )

    # get list of schedules
    schedules = _strip_suffix_and_filter(
        sorted(glob.glob("schedules/**/*schedule.yml", recursive=True)),
        ".yml",
        EXCLUDED_SCHEDULES,
    )

    # write workflows
    write_workflows(
        jobs,
        jobs_using_registry_components,
        endpoints,
        resources,
        assets,
        scripts,
        schedules,
    )

    # read existing README.md
    with open("README.md", "r") as f:
        readme_before = f.read()

    # write README.md
    write_readme(jobs, endpoints, resources, assets, scripts, schedules)

    # read modified README.md
    with open("README.md", "r") as f:
        readme_after = f.read()

    # check if readme matches
    if args.check_readme and not check_readme(readme_before, readme_after):
        print("README.md file did not match...")
        # SystemExit is raised directly: the bare exit() helper is injected by
        # the site module and is not guaranteed to exist in every interpreter.
        raise SystemExit(2)