Skip to content

Commit

Permalink
test.py works
Browse files (browse the repository at this point in the history)
  • Loading branch information
sammysignal committed Dec 10, 2015
1 parent 65747e3 commit 7b07339
Show file tree
Hide file tree
Showing 3 changed files with 36 additions and 6 deletions.
1 change: 0 additions & 1 deletion OptimizedEntityLinking/search.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,6 @@ def runLocalSearch(self, alpha, iterations):
candidateDocumentRelevances = []
currentLinkDocumentRelevances = []
context = [v[0] for k, v in state.items() if k != keyword]
print "entering loop"
for otherAssignedLink in context:
# get cached page
otherAssignedPage = self.retrieveCachedPage(candidateLink)
Expand Down
39 changes: 35 additions & 4 deletions test.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,10 +28,6 @@
totalKeywords = len(result.keys())
correctKeywords = 0
for k in result:
print result[k][0]
print currentSolution[k]
print type(result[k][0])
print type(currentSolution[k])
if result[k][0] == currentSolution[k]:
correctKeywords += 1

Expand All @@ -40,3 +36,38 @@
avg_accuracies.append(np.mean(accuracies))

print avg_accuracies



# import nltk
# with open('sample.txt', 'r') as f:
# sample = f.read()


# sentences = nltk.sent_tokenize(sample)
# tokenized_sentences = [nltk.word_tokenize(sentence) for sentence in sentences]
# tagged_sentences = [nltk.pos_tag(sentence) for sentence in tokenized_sentences]
# chunked_sentences = nltk.ne_chunk_sents(tagged_sentences, binary=True)

# def extract_entity_names(t):
# entity_names = []
# if hasattr(t, 'label') and t.label:
# if t.label() == 'NE':
# entity_names.append(' '.join([child[0] for child in t]))
# else:
# for child in t:
# entity_names.extend(extract_entity_names(child))
# return entity_names

# entity_names = []
# for tree in chunked_sentences:
# # Print results per sentence
# # print extract_entity_names(tree)
# print chunked_sentences
# entity_names.extend(extract_entity_names(tree))

# # Print all entity names
# # print entity_names

# # Print unique entity names
# print set(entity_names)
2 changes: 1 addition & 1 deletion test/solutions.txt
Original file line number Diff line number Diff line change
@@ -1,3 +1,3 @@
{"Thermodynamics":('Thermodynamics', 1), "study":('Study', 1), "heat":('Heat', 1)}
{"Airplane!":('Airplane!', 1), "movie":('movie', 1)}
{"China":('China', 1), "GDP":('Gross domestic product', 1)}
{"China":('China', 1), "country":('Country', 1), "GDP":('Gross domestic product', 1)}

0 comments on commit 7b07339

Please sign in to comment.