in managed-connectivity/sample-custom-connector/src/bootstrap.py [0:0]
def write_jsonl(output_file, json_strings):
    """Write each string to the file as one line of JSONL output.

    Args:
        output_file: An open, writable text stream (anything providing
            ``writelines``, such as the object returned by ``open(path, "w")``).
        json_strings: An iterable of strings, each written on its own line.
            Every item must be a ``str``; the items are written as given,
            in iteration order, with a single newline appended to each.

    Returns:
        None. The stream is neither flushed nor closed here; that is left
        to the caller.
    """
    # For simplicity the whole dataset goes into a single file. That is not
    # mandatory, and the order of entries doesn't matter for the Import API.
    # PySpark itself could dump the entries into many smaller JSONL files,
    # which is the recommended approach for performance.
    #
    # A generator keeps memory flat (records are produced one at a time)
    # while letting the stream batch the writes in a single call.
    output_file.writelines(record + "\n" for record in json_strings)