def compute_is_valid

def compute_is_valid_response()

in services/worker/src/worker/job_runners/split/is_valid.py [0:0]
36 lines of code
3 McCabe index (conditional complexity)

def compute_is_valid_response(dataset: str, config: str, split: str) -> IsValidResponse:
    """
    Get the response of /is-valid for one specific dataset split on huggingface.co.

    A dataset split is valid if any of the artifacts for any of the
    steps is valid.

    The five flags are derived as follows:

    - `viewer`: `is_successful_response` for `CONFIG_HAS_VIEWER_KIND`, queried at
      the config level (`split=None`).
    - `preview`: `is_successful_response` for `SPLIT_HAS_PREVIEW_KIND` on the split.
    - `filter`: `True` when the `CONFIG_PARQUET_METADATA_KIND` response could be
      fetched and its features processed without any exception.
    - `search`: `True` when, in addition, the features are a `dict` and
      `get_indexable_columns` returns at least one column for them.
    - `statistics`: `is_successful_response` for `SPLIT_HAS_STATISTICS_KIND` on
      the split.

    Args:
        dataset (`str`):
            A namespace (user or an organization) and a repo name separated
            by a `/`.
        config (`str`):
            A configuration name.
        split (`str`):
            A split name.

    Returns:
        `IsValidResponse`: The response (viewer, preview, search, filter, statistics).
    """
    logging.info(f"compute 'split-is-valid' response for {dataset=} {config=} {split=}")

    # The viewer capability is looked up per config, hence split=None.
    viewer = is_successful_response(
        dataset=dataset,
        config=config,
        split=None,
        kind=CONFIG_HAS_VIEWER_KIND,
    )
    preview = is_successful_response(
        dataset=dataset,
        config=config,
        split=split,
        kind=SPLIT_HAS_PREVIEW_KIND,
    )

    try:
        parquet_metadata_response = get_previous_step_or_raise(
            kind=CONFIG_PARQUET_METADATA_KIND,
            dataset=dataset,
            config=config,
        )
        features = parquet_metadata_response["content"]["features"]
        # Non-dict features cannot be parsed, so nothing is searchable; filtering
        # only needs the parquet metadata lookup itself to have succeeded.
        search = isinstance(features, dict) and len(get_indexable_columns(Features.from_dict(features))) > 0
        has_filter = True
    except Exception:
        # Best effort: any failure (missing or errored previous step, unexpected
        # content shape, unparsable features) disables both capabilities instead
        # of failing the whole job. Keep a trace so the cause is not lost.
        logging.debug(
            f"cannot determine search/filter for {dataset=} {config=} {split=}",
            exc_info=True,
        )
        has_filter = False
        search = False

    statistics = is_successful_response(
        dataset=dataset,
        config=config,
        split=split,
        kind=SPLIT_HAS_STATISTICS_KIND,
    )

    return IsValidResponse(
        viewer=viewer,
        preview=preview,
        search=search,
        filter=has_filter,
        statistics=statistics,
    )