id: 1 unit: def __call__() file: src/chug/wds/decode.py start line: 0 end line: 0 size: 63 LOC McCabe index: 19 number of parameters: 3 id: 2 unit: def _process_anno_pages() file: src/chug/doc/doc_read_processor.py start line: 0 end line: 0 size: 62 LOC McCabe index: 27 number of parameters: 2 id: 3 unit: def collate() file: src/chug/common/collate.py start line: 0 end line: 0 size: 39 LOC McCabe index: 26 number of parameters: 1 id: 4 unit: def __call__() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 35 LOC McCabe index: 16 number of parameters: 2 id: 5 unit: def expand_urls() file: src/chug/common/urls.py start line: 0 end line: 0 size: 34 LOC McCabe index: 11 number of parameters: 2 id: 6 unit: def _decode_anno() file: src/chug/doc/doc_vqa_processor.py start line: 0 end line: 0 size: 34 LOC McCabe index: 7 number of parameters: 2 id: 7 unit: def _parse_split_info() file: src/chug/wds/dataset_info.py start line: 0 end line: 0 size: 32 LOC McCabe index: 9 number of parameters: 2 id: 8 unit: def _expand_maybe() file: src/chug/wds/filters.py start line: 0 end line: 0 size: 31 LOC McCabe index: 12 number of parameters: 3 id: 9 unit: def __call__() file: src/chug/hfds/collate.py start line: 0 end line: 0 size: 23 LOC McCabe index: 14 number of parameters: 2 id: 10 unit: def create_loader_hf() file: src/chug/hfds/loader.py start line: 0 end line: 0 size: 20 LOC McCabe index: 1 number of parameters: 18 id: 11 unit: def expand_urls() file: src/chug/wds/helpers.py start line: 0 end line: 0 size: 20 LOC McCabe index: 6 number of parameters: 2 id: 12 unit: def __post_init__() file: src/chug/common/config.py start line: 0 end line: 0 size: 20 LOC McCabe index: 15 number of parameters: 1 id: 13 unit: def __init__() file: src/chug/doc/doc_vqa_processor.py start line: 0 end line: 0 size: 19 LOC McCabe index: 1 number of parameters: 10 id: 14 unit: def create_loader_wds() file: src/chug/wds/loader.py start line: 0 end line: 0 size: 18 LOC McCabe index: 1 number of parameters: 19 id: 15 unit: def get_pytorch_worker_seed() file: src/chug/common/random.py start line: 0 end line: 0 size: 18 LOC McCabe index: 8 number of parameters: 2 id: 16 unit: def __iter__() file: src/chug/wds/shardlists.py start line: 0 end line: 0 size: 17 LOC McCabe index: 9 number of parameters: 1 id: 17 unit: def __iter__() file: src/chug/wds/shardlists.py start line: 0 end line: 0 size: 17 LOC McCabe index: 8 number of parameters: 1 id: 18 unit: def from_arg() file: src/chug/common/config.py start line: 0 end line: 0 size: 17 LOC McCabe index: 1 number of parameters: 2 id: 19 unit: def _disable_decode() file: src/chug/hfds/loader.py start line: 0 end line: 0 size: 15 LOC McCabe index: 5 number of parameters: 1 id: 20 unit: def _expand_always() file: src/chug/wds/filters.py start line: 0 end line: 0 size: 15 LOC McCabe index: 6 number of parameters: 3 id: 21 unit: def build_data_pipeline() file: src/chug/wds/pipeline.py start line: 0 end line: 0 size: 15 LOC McCabe index: 1 number of parameters: 0 id: 22 unit: def _expand_anno() file: src/chug/doc/doc_read_processor.py start line: 0 end line: 0 size: 15 LOC McCabe index: 5 number of parameters: 3 id: 23 unit: def _map_v2() file: src/chug/wds/filters.py start line: 0 end line: 0 size: 14 LOC McCabe index: 8 number of parameters: 3 id: 24 unit: def get_dataset_size() file: src/chug/wds/dataset_info.py start line: 0 end line: 0 size: 14 LOC McCabe index: 4 number of parameters: 1 id: 25 unit: def __init__() file: src/chug/doc/doc_read_processor.py start line: 0 end line: 0 size: 14 LOC McCabe index: 1 number of parameters: 6 id: 26 unit: def run() file: src/chug/wds/filters.py start line: 0 end line: 0 size: 13 LOC McCabe index: 5 number of parameters: 2 id: 27 unit: def __init__() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 13 LOC McCabe index: 1 number of parameters: 6 id: 28 unit: def prepare_text_input() file: src/chug/text/tokenization.py start line: 0 end line: 0 size: 12 LOC McCabe index: 1 number of parameters: 0 id: 29 unit: def _decode_anno() file: src/chug/doc/doc_read_processor.py start line: 0 end line: 0 size: 12 LOC McCabe index: 3 number of parameters: 2 id: 30 unit: def __call__() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 12 LOC McCabe index: 2 number of parameters: 2 id: 31 unit: def set_default() file: src/chug/common/config.py start line: 0 end line: 0 size: 11 LOC McCabe index: 7 number of parameters: 3 id: 32 unit: def simclr() file: src/chug/common/config.py start line: 0 end line: 0 size: 11 LOC McCabe index: 1 number of parameters: 2 id: 33 unit: def __getitem__() file: src/chug/hfds/wrappers.py start line: 0 end line: 0 size: 10 LOC McCabe index: 3 number of parameters: 2 id: 34 unit: def _flatten_nested() file: src/chug/wds/filters.py start line: 0 end line: 0 size: 10 LOC McCabe index: 7 number of parameters: 4 id: 35 unit: def create_text_preprocessor() file: src/chug/text/tokenization.py start line: 0 end line: 0 size: 10 LOC McCabe index: 1 number of parameters: 0 id: 36 unit: def invoke() file: src/chug/hfds/collate.py start line: 0 end line: 0 size: 9 LOC McCabe index: 5 number of parameters: 3 id: 37 unit: def flatten_bytes() file: src/chug/hfds/collate.py start line: 0 end line: 0 size: 9 LOC McCabe index: 9 number of parameters: 1 id: 38 unit: def __init__() file: src/chug/wds/shardlists.py start line: 0 end line: 0 size: 9 LOC McCabe index: 1 number of parameters: 0 id: 39 unit: def _get_value() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 9 LOC McCabe index: 4 number of parameters: 2 id: 40 unit: def create_loader_from_config_wds() file: src/chug/loader.py start line: 0 end line: 0 size: 9 LOC McCabe index: 1 number of parameters: 8 id: 41 unit: def __iter__() file: src/chug/hfds/wrappers.py start line: 0 end line: 0 size: 8 LOC McCabe index: 3 number of parameters: 1 id: 42 unit: def __post_init__() file: src/chug/common/types.py start line: 0 end line: 0 size: 8 LOC McCabe index: 4 number of parameters: 1 id: 43 unit: def merge() file: src/chug/common/config.py start line: 0 end line: 0 size: 8 LOC McCabe index: 6 number of parameters: 3 id: 44 unit: def imagenet() file: src/chug/common/config.py start line: 0 end line: 0 size: 8 LOC McCabe index: 1 number of parameters: 2 id: 45 unit: def _preprocess_image_pages() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 8 LOC McCabe index: 6 number of parameters: 3 id: 46 unit: def __call__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 8 LOC McCabe index: 5 number of parameters: 2 id: 47 unit: def __call__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 8 LOC McCabe index: 3 number of parameters: 2 id: 48 unit: def __call__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 8 LOC McCabe index: 3 number of parameters: 2 id: 49 unit: def create_loader() file: src/chug/loader.py start line: 0 end line: 0 size: 8 LOC McCabe index: 1 number of parameters: 7 id: 50 unit: def create_loader_from_config_hf() file: src/chug/loader.py start line: 0 end line: 0 size: 8 LOC McCabe index: 1 number of parameters: 7 id: 51 unit: def __init__() file: src/chug/wds/filters.py start line: 0 end line: 0 size: 7 LOC McCabe index: 1 number of parameters: 0 id: 52 unit: def dump_and_reraise() file: src/chug/wds/helpers.py start line: 0 end line: 0 size: 7 LOC McCabe index: 1 number of parameters: 1 id: 53 unit: def envlookup() file: src/chug/common/urls.py start line: 0 end line: 0 size: 7 LOC McCabe index: 3 number of parameters: 1 id: 54 unit: def _subst_and_expand() file: src/chug/common/urls.py start line: 0 end line: 0 size: 7 LOC McCabe index: 3 number of parameters: 1 id: 55 unit: def clip() file: src/chug/common/config.py start line: 0 end line: 0 size: 7 LOC McCabe index: 1 number of parameters: 2 id: 56 unit: def __repr__() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 7 LOC McCabe index: 2 number of parameters: 1 id: 57 unit: def __init__() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 7 LOC McCabe index: 3 number of parameters: 4 id: 58 unit: def __init__() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 7 LOC McCabe index: 3 number of parameters: 4 id: 59 unit: def apply() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 7 LOC McCabe index: 1 number of parameters: 3 id: 60 unit: def build_image_transforms() file: src/chug/image/transforms_factory.py start line: 0 end line: 0 size: 7 LOC McCabe index: 1 number of parameters: 0 id: 61 unit: def build_transforms_image_timm() file: src/chug/image/build_transforms_image.py start line: 0 end line: 0 size: 7 LOC McCabe index: 1 number of parameters: 0 id: 62 unit: def build_transforms_image_basic() file: src/chug/image/build_transforms_image.py start line: 0 end line: 0 size: 7 LOC McCabe index: 1 number of parameters: 0 id: 63 unit: def __init__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 7 LOC McCabe index: 3 number of parameters: 2 id: 64 unit: def python_bounding_rect() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 7 LOC McCabe index: 1 number of parameters: 1 id: 65 unit: def group_by_keys_nothrow() file: src/chug/wds/tariterators.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 66 unit: def decode_pdf_pages() file: src/chug/wds/decode.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 67 unit: def __init__() file: src/chug/wds/shardlists.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 68 unit: def text_input_to_target() file: src/chug/text/tokenization.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 69 unit: def get_next_valid_page_index() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 70 unit: def _decode_image_pages() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 71 unit: def _decode_pdf_pages() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 72 unit: def _expand_anno() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 6 LOC McCabe index: 4 number of parameters: 3 id: 73 unit: def apply() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 3 id: 74 unit: def create_image_preprocessor() file: src/chug/image/transforms_factory.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 75 unit: def build_transforms_doc_basic() file: src/chug/image/build_transforms_doc.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 76 unit: def build_transforms_doc_better() file: src/chug/image/build_transforms_doc.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 77 unit: def build_transforms_doc_nougat() file: src/chug/image/build_transforms_doc.py start line: 0 end line: 0 size: 6 LOC McCabe index: 1 number of parameters: 0 id: 78 unit: def __call__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 6 LOC McCabe index: 3 number of parameters: 2 id: 79 unit: def set_interval_count() file: src/chug/hfds/wrappers.py start line: 0 end line: 0 size: 5 LOC McCabe index: 2 number of parameters: 2 id: 80 unit: def __init__() file: src/chug/hfds/collate.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 0 id: 81 unit: def base_plus_ext() file: src/chug/wds/tariterators.py start line: 0 end line: 0 size: 5 LOC McCabe index: 2 number of parameters: 1 id: 82 unit: def tarfile_samples_nothrow() file: src/chug/wds/tariterators.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 2 id: 83 unit: def urldir() file: src/chug/wds/helpers.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 1 id: 84 unit: def decode_image_pages() file: src/chug/wds/decode.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 0 id: 85 unit: def __init__() file: src/chug/wds/decode.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 0 id: 86 unit: def create_image_decoder() file: src/chug/wds/decode.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 0 id: 87 unit: def set_interval() file: src/chug/common/types.py start line: 0 end line: 0 size: 5 LOC McCabe index: 4 number of parameters: 2 id: 88 unit: def image_mode_to_chs() file: src/chug/common/config.py start line: 0 end line: 0 size: 5 LOC McCabe index: 3 number of parameters: 1 id: 89 unit: def split_sources() file: src/chug/common/config.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 0 id: 90 unit: def seed_worker() file: src/chug/common/random.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 1 id: 91 unit: def tokenize() file: src/chug/text/tokenization.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 0 id: 92 unit: def get_params() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 5 LOC McCabe index: 3 number of parameters: 1 id: 93 unit: def get_params() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 5 LOC McCabe index: 3 number of parameters: 1 id: 94 unit: def python_find_non_zero() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 1 id: 95 unit: def filter_missing() file: src/chug/task_pipeline/pipeline_doc_vqa.py start line: 0 end line: 0 size: 5 LOC McCabe index: 1 number of parameters: 0 id: 96 unit: def __init__() file: src/chug/hfds/wrappers.py start line: 0 end line: 0 size: 4 LOC McCabe index: 1 number of parameters: 4 id: 97 unit: def __init__() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 4 LOC McCabe index: 1 number of parameters: 5 id: 98 unit: def apply() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 4 LOC McCabe index: 1 number of parameters: 3 id: 99 unit: def __init__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 4 LOC McCabe index: 1 number of parameters: 0 id: 100 unit: def __call__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 4 LOC McCabe index: 1 number of parameters: 0 id: 101 unit: def _validate_cfgs() file: src/chug/loader.py start line: 0 end line: 0 size: 4 LOC McCabe index: 1 number of parameters: 0 id: 102 unit: def filter_no_caption_or_no_image() file: src/chug/task_pipeline/pipeline_gtparse.py start line: 0 end line: 0 size: 4 LOC McCabe index: 1 number of parameters: 0 id: 103 unit: def filter_incomplete() file: src/chug/task_pipeline/pipeline_image_text.py start line: 0 end line: 0 size: 4 LOC McCabe index: 1 number of parameters: 0 id: 104 unit: def __init__() file: src/chug/hfds/wrappers.py start line: 0 end line: 0 size: 3 LOC McCabe index: 1 number of parameters: 3 id: 105 unit: def log_and_continue() file: src/chug/wds/helpers.py start line: 0 end line: 0 size: 3 LOC McCabe index: 1 number of parameters: 1 id: 106 unit: def __post_init__() file: src/chug/common/config.py start line: 0 end line: 0 size: 3 LOC McCabe index: 2 number of parameters: 1 id: 107 unit: def prompt_end_pos() file: src/chug/text/tokenization.py start line: 0 end line: 0 size: 3 LOC McCabe index: 2 number of parameters: 3 id: 108 unit: def _squeeze_anno() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 3 LOC McCabe index: 3 number of parameters: 2 id: 109 unit: def __init__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 3 LOC McCabe index: 1 number of parameters: 2 id: 110 unit: def __call__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 3 LOC McCabe index: 1 number of parameters: 2 id: 111 unit: def create_task_pipeline() file: src/chug/task_pipeline/pipeline_factory.py start line: 0 end line: 0 size: 3 LOC McCabe index: 1 number of parameters: 1 id: 112 unit: def __len__() file: src/chug/hfds/wrappers.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 113 unit: def get_error_handler() file: src/chug/wds/helpers.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 114 unit: def __len__() file: src/chug/wds/shardlists.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 115 unit: def __init__() file: src/chug/common/types.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 2 id: 116 unit: def set_value() file: src/chug/common/types.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 2 id: 117 unit: def get_value() file: src/chug/common/types.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 118 unit: def __iter__() file: src/chug/common/types.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 119 unit: def envsubst() file: src/chug/common/urls.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 120 unit: def image_chs() file: src/chug/common/config.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 121 unit: def empty() file: src/chug/common/config.py start line: 0 end line: 0 size: 2 LOC McCabe index: 2 number of parameters: 1 id: 122 unit: def source_to_shard_spec() file: src/chug/common/config.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 0 id: 123 unit: def shard_spec() file: src/chug/common/config.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 124 unit: def _expand_anno() file: src/chug/doc/doc_vqa_processor.py start line: 0 end line: 0 size: 2 LOC McCabe index: 2 number of parameters: 3 id: 125 unit: def _decode_anno() file: src/chug/doc/doc_processor.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 2 id: 126 unit: def __init__() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 2 id: 127 unit: def __call__() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 2 id: 128 unit: def get_transform_init_args_names() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 129 unit: def get_transform_init_args_names() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 130 unit: def get_transform_init_args_names() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 131 unit: def __init__() file: src/chug/image/transforms_alb.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 132 unit: def __init__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 2 LOC McCabe index: 3 number of parameters: 2 id: 133 unit: def __init__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 1 id: 134 unit: def __init__() file: src/chug/image/transforms_torch.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 2 id: 135 unit: def build_task_pipeline_gtparse() file: src/chug/task_pipeline/pipeline_gtparse.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 0 id: 136 unit: def build_task_pipeline_manual() file: src/chug/task_pipeline/pipeline_manual.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 0 id: 137 unit: def build_task_pipeline_doc_read() file: src/chug/task_pipeline/pipeline_doc_read.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 0 id: 138 unit: def build_task_pipeline_doc_vqa() file: src/chug/task_pipeline/pipeline_doc_vqa.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 0 id: 139 unit: def build_task_pipeline_image_text() file: src/chug/task_pipeline/pipeline_image_text.py start line: 0 end line: 0 size: 2 LOC McCabe index: 1 number of parameters: 0