in drqa/reader/utils.py [0:0]
def build_feature_dict(args, examples):
    """Assign a dense integer index to every enabled feature name.

    Indices are handed out in first-seen order, starting at 0: the
    exact-match flags come first, then part-of-speech tags, then named
    entity tags, and finally the term frequency feature.

    Args:
        args: Options object. Reads ``use_in_question``, ``use_lemma``
            (consulted only when ``use_in_question`` is truthy),
            ``use_pos``, ``use_ner`` and ``use_tf``.
        examples: Iterable of mappings. ``ex['pos']`` is read when
            ``use_pos`` is set and ``ex['ner']`` when ``use_ner`` is set;
            the iterable is walked once per enabled tag family.

    Returns:
        A dict mapping each feature name to its index.
    """
    index_of = {}

    def _register(name):
        # setdefault leaves an existing entry untouched, so a repeated
        # name keeps the index from its first appearance.
        index_of.setdefault(name, len(index_of))

    def _register_tags(field, template):
        # One feature per distinct tag value found under `field`.
        for example in examples:
            for tag in example[field]:
                _register(template % tag)

    # Exact match features
    if args.use_in_question:
        exact_match = ['in_question', 'in_question_uncased']
        if args.use_lemma:
            exact_match.append('in_question_lemma')
        for name in exact_match:
            _register(name)

    # Part of speech tag features
    if args.use_pos:
        _register_tags('pos', 'pos=%s')

    # Named entity tag features
    if args.use_ner:
        _register_tags('ner', 'ner=%s')

    # Term frequency feature
    if args.use_tf:
        _register('tf')

    return index_of