Commit
·
42428e3
1
Parent(s):
a3e15e0
Partial token sort matching
Browse files
core.py
CHANGED
@@ -189,7 +189,7 @@ def drop_non_numerical_columns(df):
|
|
189 |
def output_list(input_dict, movies_df = movie_embeds, tree = btree, user_embeddings = user_embeds, movies = final_movies):
|
190 |
movie_ratings = {}
|
191 |
for movie_title in input_dict:
|
192 |
-
matching_title = process.extractOne(movie_title, final_movies['title'].values, scorer=fuzz.
|
193 |
index = movies.index[movies['title'] == matching_title].tolist()[0]
|
194 |
movie_ratings[index] = input_dict[movie_title]
|
195 |
user_embed = create_user_embedding(movie_ratings, movie_embeds)
|
|
|
189 |
def output_list(input_dict, movies_df = movie_embeds, tree = btree, user_embeddings = user_embeds, movies = final_movies):
|
190 |
movie_ratings = {}
|
191 |
for movie_title in input_dict:
|
192 |
+
matching_title = process.extractOne(movie_title, final_movies['title'].values, scorer=fuzz.partial_token_sort_ratio)[0]
|
193 |
index = movies.index[movies['title'] == matching_title].tolist()[0]
|
194 |
movie_ratings[index] = input_dict[movie_title]
|
195 |
user_embed = create_user_embedding(movie_ratings, movie_embeds)
|