From 98d3d5994fbd6c0296a7062836eb1359a8290920 Mon Sep 17 00:00:00 2001 From: 1kamma Date: Mon, 26 Jun 2023 23:21:34 +0300 Subject: [PATCH] boolean similarity --- datat.ipynb | 11 ++++++----- 1 file changed, 6 insertions(+), 5 deletions(-) diff --git a/datat.ipynb b/datat.ipynb index 9d37ac0..c447af2 100644 --- a/datat.ipynb +++ b/datat.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": 13, + "execution_count": 3, "metadata": {}, "outputs": [], "source": [ @@ -23,7 +23,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 4, "metadata": {}, "outputs": [], "source": [ @@ -34,7 +34,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -44,12 +44,13 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 6, "metadata": {}, "outputs": [], "source": [ "test_mat = tf_vectorizer.transform(df_akk['Text'].dropna().to_list())\n", - "cc = cosine_similarity(save_vect,save_vect)\n" + "cc = cosine_similarity(save_vect,save_vect)\n", + "bool_similarity = cc > 0.5\n" ] }, {