Spaces:

AntonyG
/

v0_movie_recommender_system

Sleeping

App Files Files Community

v0_movie_recommender_system / app.py

AntonyG

updated app with movies names and genre

5f98259 verified 10 months ago

raw

history blame contribute delete

3.36 kB

	import gradio as gr
	import pickle
	import numpy as np
	import pandas as pd

	def _load_pickle(path):
	    """Return the object deserialized from the pickle file at *path*."""
	    with open(path, 'rb') as handle:
	        return pickle.load(handle)


	# Parameters of the model, pickled after it was trained from scratch.
	model_state = _load_pickle('final_02_model_biases_factors.pkl')
	user_bias, movie_bias, user_factors, movie_factors = (
	    model_state[key]
	    for key in ("user_bias", "movie_bias", "user_factors", "movie_factors")
	)

	# Movie metadata; the functions below read its movieId, title and genres columns.
	movies = pd.read_csv("movies.csv")

	# Lookup tables between movieId values and positions in the factor/bias arrays.
	map_movie_to_idx = _load_pickle('map_movie_to_idx.pkl')
	map_idx_to_movie = _load_pickle('map_idx_to_movie.pkl')

	def get_movie_id(title):
	    """Find the first movie whose title contains *title*.

	    The search is a case-insensitive, literal substring match against the
	    ``title`` column of the module-level ``movies`` DataFrame. Rows whose
	    title is missing never match.

	    Args:
	        title: Text to look for. Leading and trailing whitespace is ignored.

	    Returns:
	        A ``(movieId, title, genres)`` tuple taken from the first matching
	        row, or ``(None, None, None)`` when the query is blank or nothing
	        matches.
	    """
	    query = title.strip() if title else ""
	    if not query:
	        # An empty pattern is contained in every title, which would silently
	        # pick the first row of the table instead of reporting "not found".
	        return None, None, None

	    # regex=False: the query is user-typed text, not a pattern. With the
	    # default regex=True, characters such as "(" or "+" are interpreted as
	    # regex syntax, so they either fail to match literally or raise on
	    # malformed input.
	    mask = movies['title'].str.contains(query, case=False, na=False, regex=False)
	    matches = movies[mask]
	    if matches.empty:
	        return None, None, None

	    first = matches.iloc[0]
	    return first['movieId'], first['title'], first['genres']

	def recommend_movies(movie_title, rating, latent_dim=10, lambda_param=0.1, tau=0.1):
	    """Build an HTML list of up to ten movies recommended from one rated movie.

	    A throwaway ("dummy") user who gave ``rating`` to the matched movie is
	    fitted in closed form, and every movie is then scored against that
	    user's latent vector plus a small share of the movie's bias.

	    Args:
	        movie_title: Text used to find the rated movie via ``get_movie_id``.
	        rating: Rating the dummy user gives to that movie.
	        latent_dim: Size of the identity matrix added to the outer product of
	            the movie's factor vector, so it must equal that vector's length.
	        lambda_param: Multiplier on the outer-product term and on the
	            right-hand side of the linear system.
	        tau: Multiplier on the identity term of the linear system.

	    Returns:
	        An HTML fragment showing the selected movie followed by the
	        recommendations, highest score first. A short message is returned
	        instead when no title matches or when the matched movie has no entry
	        in ``map_movie_to_idx``.
	    """
	    # Function-scope import so this block does not depend on the file header.
	    from html import escape

	    movie_id, title, genres = get_movie_id(movie_title)
	    if movie_id is None:
	        # The text comes straight from the user and is rendered as HTML.
	        return f"Movie '{escape(str(movie_title))}' not found."

	    # Map the dummy movie id to its index; a movie listed in ``movies`` but
	    # missing from the index map cannot be scored.
	    try:
	        dummy_movie_index = map_movie_to_idx[movie_id]
	    except KeyError:
	        return (
	            f"Movie '{escape(str(title))}' has no entry in the trained model, "
	            "so no recommendations are available."
	        )

	    # Factors and bias of the rated movie.
	    dummy_movie_factors = movie_factors[:, dummy_movie_index]
	    dummy_movie_bias = movie_bias[dummy_movie_index]

	    # Regularised least-squares fit of the dummy user from a single rating:
	    # (lambda * v v^T + tau * I) u = lambda * v * (rating - bias).
	    # solve() avoids forming the explicit inverse.
	    system = (
	        lambda_param * np.outer(dummy_movie_factors, dummy_movie_factors)
	        + tau * np.eye(latent_dim)
	    )
	    target = lambda_param * dummy_movie_factors * (rating - dummy_movie_bias)
	    dummy_user_factor = np.linalg.solve(system, target)

	    # Score every movie for the dummy user.
	    score = dummy_user_factor @ movie_factors + 0.05 * movie_bias

	    # argsort is ascending, so reverse it to walk from the best score down.
	    ranked_indices = np.argsort(score)[::-1]

	    entries = []
	    for movie_index in ranked_indices:
	        if movie_index == dummy_movie_index:
	            # Do not recommend the movie the user has just rated.
	            continue
	        row = movies.loc[movies["movieId"] == map_idx_to_movie[movie_index]]
	        if row.empty:
	            # No metadata row for this id, so there is nothing to display.
	            continue
	        rec_title = escape(str(row["title"].values[0]))
	        rec_genres = escape(str(row["genres"].values[0]))
	        entries.append(
	            f"<div style='margin-bottom: 10px;'><strong>{len(entries) + 1}. {rec_title}</strong>"
	            f"<br>Genres: {rec_genres}</div>"
	        )
	        if len(entries) == 10:
	            break

	    # Format the output as HTML.
	    parts = [
	        "<div style='font-family: Arial, sans-serif;'>",
	        "<div style='margin-bottom: 20px;'><strong>Selected Movie:</strong>"
	        f"<br>Title: {escape(str(title))}<br>Genres: {escape(str(genres))}</div>",
	        "<div style='margin-bottom: 20px;'><strong>Recommended Movies:</strong></div>",
	    ]
	    parts.extend(entries)
	    parts.append("</div>")
	    return "".join(parts)

	# Define the Gradio interface: a title box and a rating slider feed
	# recommend_movies, whose return value is shown through the "html" output.
	iface = gr.Interface(
	    fn=recommend_movies,
	    inputs=[
	        gr.Textbox(label="Movie Title"),
	        gr.Slider(0, 5, step=0.1, label="Rating"),
	    ],
	    outputs="html",
	    title="Movie Recommendation System",
	    description="""
	Enter a movie title and rating to get top 10 movie recommendations.
	I made this demo as part of a machine learning class taught by Prof. Ulrich Paquet at AIMS South Africa.
	Here are some sample movies you can try out of a database of over 62,000 movies:
	- Toy Story
	- Incredibles
	- Lord of the rings
	- Star Wars
	- Terminator
	""",
	)

	# Start the app when this module runs; share=True is kept from the original.
	iface.launch(share=True)