Change filter option: call get_all_data with filter_non_english=True instead of False

......@@ -89,7 +89,7 @@ def main():
tfidf_matrix_file_name = 'tfidf_matrix.npz'
if tfidf_matrix_file_name not in os.listdir('./') or csv_file_name not in os.listdir('./'):
paper_ids, titles, abstracts, bodies = get_all_data(filter_non_english=False)
paper_ids, titles, abstracts, bodies = get_all_data(filter_non_english=True)
tfidf_matrix = get_tfidf_matrix([a + " " + b for a, b in zip(abstracts, bodies)])
# save important data for future runs
with open(csv_file_name, 'w', encoding='utf-8') as f:
