in 04_streaming/transform/df03.py [0:0]
def tz_correct(line, airport_timezones):
    """Convert the time fields of one JSON flight record using ``as_utc``.

    This is a generator: it yields the re-serialized record once on success
    and yields nothing when a ``KeyError`` is raised while processing the
    record (the record is logged and skipped).

    Args:
        line: JSON document for a single record, parsed with ``json.loads``.
        airport_timezones: Mapping keyed by the record's
            ``ORIGIN_AIRPORT_SEQ_ID`` / ``DEST_AIRPORT_SEQ_ID`` values; each
            value is indexable and its element ``[2]`` is handed to
            ``as_utc`` as the timezone.

    Yields:
        The record serialized with ``json.dumps`` after the departure-side
        and arrival-side time fields have been replaced by ``as_utc`` results.

    Raises:
        ValueError: If ``line`` is not valid JSON. Parsing happens outside
            the ``try`` block, so this is not swallowed.
    """
    fields = json.loads(line)
    try:
        # convert all times to UTC
        dep_airport_id = fields["ORIGIN_AIRPORT_SEQ_ID"]
        arr_airport_id = fields["DEST_AIRPORT_SEQ_ID"]
        dep_timezone = airport_timezones[dep_airport_id][2]
        arr_timezone = airport_timezones[arr_airport_id][2]

        # Departure-side fields use the origin airport's timezone ...
        for f in ("CRS_DEP_TIME", "DEP_TIME", "WHEELS_OFF"):
            fields[f] = as_utc(fields["FL_DATE"], fields[f], dep_timezone)
        # ... and arrival-side fields use the destination airport's timezone.
        for f in ("WHEELS_ON", "CRS_ARR_TIME", "ARR_TIME"):
            fields[f] = as_utc(fields["FL_DATE"], fields[f], arr_timezone)

        yield json.dumps(fields)
    except KeyError:
        # Pass the record as a lazy %-argument instead of concatenating:
        # json.loads accepts bytes/bytearray, and "str + bytes" would raise
        # TypeError here and mask the KeyError being reported.
        # NOTE(review): any KeyError in the try body (including a missing
        # record field) is reported with this "airport is not known" message.
        logging.exception(" Ignoring %s because airport is not known", line)