finished the interface

581ff39b · Paktalin · c1ae90b8
Commit 581ff39b authored Dec 21, 2018 by Paktalin
Showing with 25 additions and 12 deletions
__pycache__/plot_util.cpython-36.pyc
estnltk_preprocessing.py
main.py
pictures/cases_frequency.png
pictures/cases_pdf.png
pictures/g_ad.png
pictures/g_all.png
pictures/g_el.png
pictures/in_g.png
pictures/n_ad.png
pictures/n_adt.png
pictures/n_all.png
pictures/n_el.png
pictures/n_g.png
pictures/n_in.png
pictures/p_ad.png
pictures/p_adt.png
pictures/p_all.png
pictures/p_el.png
pictures/p_g.png
--- a/__pycache__/plot_util.cpython-36.pyc
+++ b/__pycache__/plot_util.cpython-36.pyc
--- a/estnltk_preprocessing.py
+++ b/estnltk_preprocessing.py
@@ -85,7 +85,9 @@ def construct_df_of_verbs(initial_df):
 	print(verbs_df)


-if __name__ == '__main__':
-	df = read_csv('cleaned_dataframe.csv', sep='~')
-	df.columns = ['distance', 'noun_like', 'noun_like_form', 'noun_like_pos', 'sentence', 'verb', 'verbs_form']
-	construct_df_of_verbs(df)
\ No newline at end of file
+# df = read_csv('cleaned_dataframe.csv', sep='~')
+# df.columns = ['distance', 'noun_like', 'noun_like_form', 'noun_like_pos', 'sentence', 'verb', 'verbs_form']
+# construct_df_of_verbs(df)
+
+df = read_csv('verbs.csv', sep='~', header=0)
+print(len(df.columns))
\ No newline at end of file
--- a/main.py
+++ b/main.py
@@ -33,13 +33,21 @@ def plot_results(X, R, forms, df):
 		print('Cluster', k)
 		print(df[R[:,k] == 1]['verb'])

-def print_verb_info(verb, df, X, R, forms):
-	current_verb_index = df[df['verb'] == verb].index
-	print_cluster(current_verb_index, df, X, R)
-	pie_chart_verb(X[current_verb_index][0].tolist(), forms.tolist(), verb)
-	print_sample_usages(verb)
+def print_verb_info(df, X, R, forms):
+	while(True):
+		verb = input('\nPlease, enter the verb. Or \'e\' to exit: ')
+		if verb == 'e':
+			break
+		elif len(df[df['verb'] == verb]) != 0:
+			current_verb_index = df[df['verb'] == verb].index
+			print_cluster(current_verb_index, df, X, R)
+			pie_chart_verb(X[current_verb_index][0].tolist(), forms.tolist(), verb)
+			print_sample_usages(verb)
+		else:
+			print('Sorry. The verb was not found')

 def print_cluster(current_verb_index, df, X, R):
+	print('\nSimilar verbs are:')
 	R_verb = R[current_verb_index][0]
 	k = np.where(R_verb == 1)[0][0]
 	similar_verbs = df[R[:,k] == 1]['verb']
@@ -50,6 +58,7 @@ def print_cluster(current_verb_index, df, X, R):
 	print(list(similar_verbs_dict.keys())[1:])

 def print_sample_usages(verb):
+	print('\nSample usages of the verb:')
 	df = read_csv('cleaned_dataframe.csv', sep='~')
 	df.columns = ['distance', 'noun_like', 'noun_like_form', 'noun_like_pos', 'sentence', 'verb', 'verbs_form']
 	sentences = df[df['verb'] == verb]['sentence'].tolist()
@@ -69,4 +78,4 @@ def print_sample_usages(verb):
 R = np.genfromtxt('R.csv', delimiter='~')
 M = np.genfromtxt('M.csv', delimiter='~')
 X, verbs, forms, df = get_verbs_data()
-print_verb_info('armastama', df, X, R, forms)
\ No newline at end of file
+print_verb_info(df, X, R, forms)
\ No newline at end of file
--- a/pictures/cases_frequency.png
+++ b/pictures/cases_frequency.png
--- a/pictures/cases_pdf.png
+++ b/pictures/cases_pdf.png
--- a/pictures/g_ad.png
+++ b/pictures/g_ad.png
--- a/pictures/g_all.png
+++ b/pictures/g_all.png
--- a/pictures/g_el.png
+++ b/pictures/g_el.png
--- a/pictures/in_g.png
+++ b/pictures/in_g.png
--- a/pictures/n_ad.png
+++ b/pictures/n_ad.png
--- a/pictures/n_adt.png
+++ b/pictures/n_adt.png
--- a/pictures/n_all.png
+++ b/pictures/n_all.png
--- a/pictures/n_el.png
+++ b/pictures/n_el.png
--- a/pictures/n_g.png
+++ b/pictures/n_g.png
--- a/pictures/n_in.png
+++ b/pictures/n_in.png
--- a/pictures/p_ad.png
+++ b/pictures/p_ad.png
--- a/pictures/p_adt.png
+++ b/pictures/p_adt.png
--- a/pictures/p_all.png
+++ b/pictures/p_all.png
--- a/pictures/p_el.png
+++ b/pictures/p_el.png
--- a/pictures/p_g.png
+++ b/pictures/p_g.png
--- a/pictures/p_kom.png
+++ b/pictures/p_kom.png
--- a/pictures/p_n.png
+++ b/pictures/p_n.png
--- a/pictures/pie_charts/0.png
+++ b/pictures/pie_charts/0.png
--- a/pictures/pie_charts/1.png
+++ b/pictures/pie_charts/1.png
--- a/pictures/pie_charts/2.png
+++ b/pictures/pie_charts/2.png
--- a/pictures/pie_charts/3.png
+++ b/pictures/pie_charts/3.png
--- a/pictures/pie_charts/4.png
+++ b/pictures/pie_charts/4.png
--- a/pictures/pie_charts/5.png
+++ b/pictures/pie_charts/5.png
--- a/pictures/pie_charts/6.png
+++ b/pictures/pie_charts/6.png
--- a/pictures/pie_charts/7.png
+++ b/pictures/pie_charts/7.png
--- a/pictures/pie_charts/8.png
+++ b/pictures/pie_charts/8.png
--- a/pictures/pie_charts/9.png
+++ b/pictures/pie_charts/9.png
--- a/pictures/unimportant1.png
+++ b/pictures/unimportant1.png
--- a/plot_util.py
+++ b/plot_util.py
@@ -26,6 +26,8 @@ def plot_form_pdf(X, forms):
 			ax = pd.DataFrame(x).plot.density(bw_method=0.1)
 		labels.append('%s - mean: %.4f std: %.4f' % (forms[i], x.mean(), np.std(x)))
 	plt.xlim(-0.01, 0.015)
+	plt.xlabel('Usages per sample')
+	plt.yticks([])
 	plt.legend(labels=labels)
 	plt.show()