diff --git a/datat.ipynb b/datat.ipynb index 9d37ac0..c447af2 100644 --- a/datat.ipynb +++ b/datat.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": 13, + "execution_count": 3, "metadata": {}, "outputs": [], "source": [ @@ -23,7 +23,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 4, "metadata": {}, "outputs": [], "source": [ @@ -34,7 +34,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -44,12 +44,13 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 6, "metadata": {}, "outputs": [], "source": [ "test_mat = tf_vectorizer.transform(df_akk['Text'].dropna().to_list())\n", - "cc = cosine_similarity(save_vect,save_vect)\n" + "cc = cosine_similarity(save_vect,save_vect)\n", + "bool_similarity = cc > 0.5\n" ] }, {