aboutsummaryrefslogtreecommitdiff
path: root/db2pc.py
blob: f0d6ba94276edf4e2aebacdff471c00e00ec9c43 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
from database import *
import pandas as pd

from sentence_transformers import SentenceTransformer

# SQLAlchemy-style URL of the SQLite database file that is read below.
database_url = "sqlite:///jlm.db"

# init_db_stuff is provided by the project's `database` module (star import
# above). It returns a pair: the first item is handed to pandas as the SQL
# connection; the second is kept as `Session` (unused in this script as shown).
engine, Session = init_db_stuff(database_url)

# Sentence-embedding model, loaded by name. Nothing in the visible script
# calls it yet; presumably it is meant to encode `combined_text` -- TODO confirm.
model = SentenceTransformer("paraphrase-multilingual-MiniLM-L12-v2")

# Load every column of the `movies` table into a DataFrame.
df = pd.read_sql("Select * from movies", engine)

# Build one text string per row from title, overview, tagline and genres.
# Every column is passed through fillna('') first: in pandas, string + NaN
# evaluates to NaN, so a single missing field (the title included) would
# otherwise turn the whole combined text for that row into NaN.
df["combined_text"] = (
    df["title"].fillna('')
    + ": "
    + df["overview"].fillna('')
    + " -  "
    + df["tagline"].fillna('')
    + " Genres:-  "
    + df["genres"].fillna('')
)

# There is exactly one combined_text entry per row, so the frame length is
# the number of texts; no need to materialize a list just to count it.
print(len(df))