def fetch_ground_truths()

in src/kg_validator.py [0:0]


def fetch_ground_truths(conn) -> "pd.DataFrame":
    """Collect, for every typed keyword, the URL hashes recorded for it.

    Joins ``moz_inputhistory`` to ``moz_places`` on ``place_id`` and skips
    rows whose ``input`` is the empty string.

    Args:
        conn: An open database connection. Its cursor's ``execute`` must
            return an object exposing ``fetchall`` (as ``sqlite3`` cursors
            do), because the call is chained.

    Returns:
        A DataFrame with one row per distinct keyword and two columns:
        ``keyword`` and ``url_hash``. Each ``url_hash`` cell is a list of
        hashes ordered by descending ``use_count``, since the query sorts
        the rows and ``groupby`` keeps row order within each group.

    Raises:
        Any error raised by the database driver while running the query;
        the cursor is closed before the error propagates.
    """
    query = """
        SELECT ih.input AS keyword,
               p.url_hash,
               ih.use_count,
               p.url
          FROM moz_inputhistory ih
          JOIN moz_places p
            ON ih.place_id = p.id
          WHERE input != ''
          ORDER BY keyword, use_count DESC
        """
    columns = ['keyword', 'url_hash', 'use_count', 'url']

    cursor = conn.cursor()
    try:
        rows = cursor.execute(query).fetchall()
    finally:
        # Release the cursor even when the query fails (e.g. a table is
        # missing), so a failed call does not leave it open.
        cursor.close()

    actuals_df = pd.DataFrame(rows, columns=columns)
    return actuals_df.groupby('keyword')['url_hash'].agg(list).reset_index()