in text-semantic-search/embeddings_extraction/etl/pipeline.py [0:0]
def get_source_query(limit=1000000): query = """