def compare

def compare_json()

in microservices/matching_service/src/utils/json_matching/match_json.py [0:0]
67 lines of code
31 McCabe index (conditional complexity)

def _first_value(frame, key):
  """Returns the 'value' cell of the first row in frame whose 'entity' is key.

  Args:
    frame: DataFrame with 'entity' and 'value' columns.
    key: entity name to look up; the caller must already have checked that
      it is present, otherwise the lookup raises IndexError.
  Returns: the value stored for the first matching row.
  """
  return list(frame.loc[frame['entity'] == key, 'value'])[0]


def _score_values(app_val, support_val, rule, app_doc_type, state):
  """Scores one pair of already normalised (lower-cased, stripped) values.

  Args:
    app_val: value taken from the application form.
    support_val: value taken from the supporting document.
    rule: entry of the user-key config for this entity. A tuple marks a date
      key: index 0 is the weight and index 1 is forwarded to compare_dates
      (presumably the supporting doc's date format - confirm against the
      config). Anything else is used directly as the weight.
    app_doc_type: lower-cased application doc type, used to pick the
      application date format.
    state: lower-cased context, used to pick the application date format.
  Returns: tuple (raw_score, weighted_score) where weighted_score is
    raw_score * weight rounded to 2 decimals.
  """
  if isinstance(rule, tuple):
    # 1. dates: the application-side format is looked up lazily so that doc
    # types without any date key never need an APPLICATION_DOC_DATE_FORMAT
    # entry.
    weight = rule[0]
    raw_score = compare_dates(
        app_val, support_val,
        APPLICATION_DOC_DATE_FORMAT[app_doc_type][state], rule[1])
  elif support_val.isdigit() and app_val.isdigit():
    # 2. purely numeric values must match exactly
    weight = rule
    raw_score = 1.0 if support_val == app_val else 0.0
  else:
    # 3. free text: fuzzy, word-order-insensitive similarity scaled to 0..1
    weight = rule
    raw_score = float(fuzz.token_sort_ratio(support_val, app_val) / 100)
  return raw_score, round(raw_score * weight, 2)


def compare_json(application_json_obj, supporting_json_obj, sd_doc_type,
                 af_doc_type, context):
  """Scores how well a supporting doc's entities match the application form.

  For every entity configured in MATCHING_USER_KEYS_SUPPORTING_DOC for the
  supporting doc type, the values found in both documents are lower-cased,
  stripped of trailing spaces/newlines and compared (dates via compare_dates,
  digit-only strings by equality, everything else by fuzzy token-sort ratio).

  Args:
    application_json_obj: application form entities; loaded into a DataFrame
      from which the 'entity' and 'value' columns are read.
    supporting_json_obj: list of dicts with 'entity' and 'value' keys for the
      supporting doc. It is modified in place.
    sd_doc_type: supporting doc type; lower-cased and used as the key into
      MATCHING_USER_KEYS_SUPPORTING_DOC.
    af_doc_type: application form doc type; lower-cased and used as the first
      key into APPLICATION_DOC_DATE_FORMAT.
    context: lower-cased and used as the second key into
      APPLICATION_DOC_DATE_FORMAT.
  Returns: supporting_json_obj, where every entity dict carries a
    'matching_score' key (the raw score for the first entry of each
    configured entity, None for entries that were not scored) followed by
    one extra dict {'Avg Matching Score': <sum of the weighted scores,
    rounded to 2 decimals>}. Returns None when the supporting doc type is
    not configured or when any error occurs during the comparison.
  """
  # The whole comparison is a best-effort boundary: callers get None on any
  # failure (malformed input, non-string values, missing config entries).
  try:
    support_doc_type = sd_doc_type.lower()
    app_doc_type = af_doc_type.lower()
    state = context.lower()

    app_df = pd.DataFrame(application_json_obj)
    app_keys = list(app_df['entity'])
    Logger.info(app_keys)
    support_df = pd.DataFrame(supporting_json_obj)
    support_keys = list(support_df['entity'])
    Logger.info(support_keys)

    if support_doc_type not in MATCHING_USER_KEYS_SUPPORTING_DOC:
      Logger.error('Unsupported supporting doc')
      return None

    support_doc_dict = MATCHING_USER_KEYS_SUPPORTING_DOC[support_doc_type]
    matched = []

    for u_key, rule in support_doc_dict.items():
      final_score = 0.0
      # only keys present in both documents can be compared
      if u_key in app_keys and u_key in support_keys:
        app_val = _first_value(app_df, u_key)
        support_val = _first_value(support_df, u_key)
        if app_val and support_val:
          final_score, wt_score = _score_values(
              app_val.lower().rstrip('\n '),
              support_val.lower().rstrip('\n '),
              rule, app_doc_type, state)
          matched.append(wt_score)
        else:
          Logger.warning(f'Values related to keys are None: {u_key}')

      # record the raw score on the first supporting entry for this key
      for entry in supporting_json_obj:
        if entry['entity'] == u_key:
          entry['matching_score'] = final_score
          break

    # Entries that were never scored get an explicit None, wherever they sit
    # in the list, so every entity dict has the same set of keys.
    for entry in supporting_json_obj:
      entry.setdefault('matching_score', None)

    supporting_json_obj.append(
        {'Avg Matching Score': round(sum(matched), 2)})
    return supporting_json_obj

  except Exception as e:
    Logger.error(e)
    return None