in python/dataproc_templates/elasticsearch/elasticsearch_to_bigtable.py [0:0]
def parse_args(args: Optional[Sequence[str]] = None) -> Dict[str, Any]:
    """Parse the command-line options for the Elasticsearch to BigTable job.

    Options that the parser does not recognise are ignored rather than
    rejected, because parsing is done with ``parse_known_args``.

    After parsing, the Elasticsearch credentials are validated: the caller
    must supply either an API key, or both a user and a password, and must
    not mix the two mechanisms.

    Args:
        args: Argument strings to parse. When ``None``, argparse falls back
            to ``sys.argv[1:]``.

    Returns:
        A dict mapping every registered option's ``dest`` name to its parsed
        value (``vars()`` of the resulting namespace).

    Raises:
        SystemExit: If a required option is missing or malformed (raised by
            argparse), or if the credential combination is invalid.
    """
    parser: argparse.ArgumentParser = argparse.ArgumentParser()

    # Elasticsearch source options.
    parser.add_argument(
        f'--{constants.ES_BT_INPUT_NODE}',
        dest=constants.ES_BT_INPUT_NODE,
        required=True,
        help='Elasticsearch Node Uri'
    )
    parser.add_argument(
        f'--{constants.ES_BT_INPUT_INDEX}',
        dest=constants.ES_BT_INPUT_INDEX,
        required=True,
        help='Elasticsearch Index Name'
    )

    # Credentials are individually optional here; the valid combinations are
    # enforced after parsing, below.
    parser.add_argument(
        f'--{constants.ES_BT_NODE_USER}',
        dest=constants.ES_BT_NODE_USER,
        help='Elasticsearch Node User'
    )
    parser.add_argument(
        f'--{constants.ES_BT_NODE_PASSWORD}',
        dest=constants.ES_BT_NODE_PASSWORD,
        help='Elasticsearch Node Password'
    )
    parser.add_argument(
        f'--{constants.ES_BT_NODE_API_KEY}',
        dest=constants.ES_BT_NODE_API_KEY,
        help='Elasticsearch Node API Key'
    )

    # NOTE(review): presumably registers the Elasticsearch Spark connector
    # options under the "es.bt.input." prefix on this parser; confirm against
    # the helper's definition.
    add_es_spark_connector_options(
        parser,
        constants.get_es_spark_connector_input_options("es.bt.input.")
    )

    # Flattening switches: present on the command line means True.
    parser.add_argument(
        f'--{constants.ES_BT_FLATTEN_STRUCT}',
        dest=constants.ES_BT_FLATTEN_STRUCT,
        action='store_true',
        required=False,
        help='Flatten the struct fields'
    )
    parser.add_argument(
        f'--{constants.ES_BT_FLATTEN_ARRAY}',
        dest=constants.ES_BT_FLATTEN_ARRAY,
        action='store_true',
        required=False,
        help=(
            'Flatten the n-D array fields to 1-D array fields,'
            f' it needs {constants.ES_BT_FLATTEN_STRUCT} to be true'
        )
    )

    # BigTable sink options.
    parser.add_argument(
        f'--{constants.ES_BT_PROJECT_ID}',
        dest=constants.ES_BT_PROJECT_ID,
        required=True,
        help='BigTable project ID'
    )
    parser.add_argument(
        f'--{constants.ES_BT_INSTANCE_ID}',
        dest=constants.ES_BT_INSTANCE_ID,
        required=True,
        help='BigTable instance ID'
    )
    # NOTE(review): no ``type=`` is set, so a value given on the command line
    # is kept as the raw string (e.g. "false"), while the default is the bool
    # False. Left as-is to avoid changing what downstream code receives.
    parser.add_argument(
        f'--{constants.ES_BT_CREATE_NEW_TABLE}',
        dest=constants.ES_BT_CREATE_NEW_TABLE,
        required=False,
        help='BigTable create new table flag. Default is false.',
        default=False
    )
    parser.add_argument(
        f'--{constants.ES_BT_BATCH_MUTATE_SIZE}',
        dest=constants.ES_BT_BATCH_MUTATE_SIZE,
        required=False,
        # Convert at parse time so the value is an int whether it comes from
        # the command line or from the default, and so a non-numeric value is
        # rejected immediately by argparse.
        type=int,
        help='BigTable batch mutate size. Maximum allowed size is 100000. Default is 100.',
        default=100
    )
    parser.add_argument(
        f'--{constants.ES_BT_CATALOG_JSON}',
        dest=constants.ES_BT_CATALOG_JSON,
        required=True,
        help='BigTable catalog inline json'
    )

    known_args: argparse.Namespace
    known_args, _ = parser.parse_known_args(args)

    # Read the credentials once; each is None when its option was omitted.
    api_key = getattr(known_args, constants.ES_BT_NODE_API_KEY)
    user = getattr(known_args, constants.ES_BT_NODE_USER)
    password = getattr(known_args, constants.ES_BT_NODE_PASSWORD)

    if not api_key and (not user or not password):
        # Neither a complete user/password pair nor an API key was given.
        sys.exit(
            "ArgumentParser Error: Either of es.bt.input.user and es.bt.input.password "
            "OR es.bt.input.api.key needs to be provided as argument to read data from Elasticsearch"
        )
    elif api_key and (user or password):
        # The two authentication mechanisms are mutually exclusive.
        sys.exit(
            "ArgumentParser Error: Both es.bt.input.user and es.bt.input.password "
            "AND es.bt.input.api.key cannot be provided as arguments at the same time."
        )

    return vars(known_args)