Skip to content

Commit dd3435e

Browse files
committed
Create a chart with the similarity score for each other book in the set; run.py updated; .pdf file added as an example of the saving feature
1 parent 3a7cbf9 commit dd3435e

File tree

3 files changed

+16
-2
lines changed

3 files changed

+16
-2
lines changed
17.2 KB
Binary file not shown.

BooksSimilarity/run.py

+5-2
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
from prepare_texts import get_texts, read, preprocess, stemming
22
from words_occurrences import get_dict, bows, most_common, tf_idf
3+
from show_most_similar_books import show_similaryty_chart
34

45

56
def discover_similar_books():
@@ -23,10 +24,12 @@ def discover_similar_books():
2324
# print(bags_of_words[0])
2425

2526
common_words_0 = most_common(0, bags_of_words, stemmed)
26-
print(common_words_0)
27+
# print(common_words_0)
2728

2829
books_similarities = tf_idf(bags_of_words, titles)
29-
print(books_similarities)
30+
# print(books_similarities)
31+
32+
show_similaryty_chart(books_similarities, 'CoralReefs')
3033

3134

3235
if __name__ == '__main__':
+11
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
import matplotlib.pyplot as plt
2+
3+
4+
def show_similaryty_chart(df, title):
    """Save a horizontal bar chart of the similarity scores for one book.

    Selects ``df[title]``, sorts the values in ascending order, draws them
    as horizontal bars and writes the chart to ``<title>_similarities.pdf``
    (a path relative to the current working directory).

    Args:
        df: Object indexable by ``title`` whose result supports
            ``sort_values()`` and ``plot()`` -- presumably a pandas
            DataFrame of pairwise book similarities; confirm against the
            caller.
        title: Key of the book to chart; also used as the prefix of the
            output file name.

    Returns:
        None. The only result is the PDF file written to disk.
    """
    values_sorted = df[title].sort_values()

    # Draw on a dedicated figure instead of pyplot's implicit "current"
    # figure: otherwise a second call can paint its bars on top of the
    # previous chart, and every call leaves an open figure behind.
    fig, ax = plt.subplots()
    try:
        values_sorted.plot(kind='barh', ax=ax)
        ax.set_title('Similarity Score')
        ax.set_xlabel('Similarities')
        ax.set_ylabel('Titles')
        # Save the figure we actually drew on, not whatever pyplot
        # currently considers active.
        fig.savefig(title + '_similarities.pdf')
    finally:
        # Release the figure even if plotting or saving fails.
        plt.close(fig)

0 commit comments

Comments
 (0)