in src/kg_validator.py [0:0]
def fetch_ground_truths(conn):
    """Load the observed keyword -> url_hash pairs from the input history.

    Joins ``moz_inputhistory`` to ``moz_places`` on ``place_id = id``, skips
    rows whose ``input`` is the empty string, and collects the matching
    ``url_hash`` values for every distinct keyword.

    Args:
        conn: An open database connection. The code relies on
            ``conn.cursor().execute(...)`` returning an object that has
            ``fetchall()`` (as ``sqlite3`` cursors do).
            NOTE(review): presumably a connection to a Firefox
            ``places.sqlite`` database -- confirm against the caller.

    Returns:
        A ``pandas.DataFrame`` with one row per keyword and two columns:
        ``keyword`` and ``url_hash``, where ``url_hash`` is a list of the
        hashes recorded for that keyword. Within each list the hashes keep
        the query order, i.e. descending ``use_count``.

    Raises:
        Whatever the underlying driver raises when the query fails; the
        cursor is closed before the exception propagates.
    """
    cursor = conn.cursor()
    try:
        rows = cursor.execute(
            """
            SELECT ih.input AS keyword,
                   p.url_hash,
                   ih.use_count,
                   p.url
            FROM moz_inputhistory ih
            JOIN moz_places p
              ON ih.place_id = p.id
            WHERE input != ''
            ORDER BY keyword, use_count DESC
            """
        ).fetchall()
    finally:
        # Release the cursor even when execute()/fetchall() raises, so a
        # failed query does not leave it open on the connection.
        cursor.close()

    columns = ['keyword', 'url_hash', 'use_count', 'url']
    actuals_df = pd.DataFrame(rows, columns=columns)
    # groupby keeps the original row order inside each group, so the
    # ORDER BY ... use_count DESC ranking survives in every list.
    return actuals_df.groupby('keyword')['url_hash'].agg(list).reset_index()