CornellNLP · Benja1958 · Mar 17, 2025 · Mar 19, 2025 · Mar 19, 2025 · Mar 19, 2025
diff --git a/.gitignore b/.gitignore
@@ -3,6 +3,8 @@ env/
 Docker/__pycache__
 
 venv/
+project-venv/
+test-env/
 
 *.pyc
 __pycache__/
@@ -17,4 +19,6 @@ dist/
 build/
 *.egg-info/
 helpers/*
-json_template/
+json_template/
+
+.history
diff --git a/backend/.coveragerc b/backend/.coveragerc
@@ -0,0 +1,12 @@
+# .coveragerc
+[run]
+branch = True
+source = backend
+
+[report]
+omit =
+    */__init__.py
+    */tests/*
+    */config.py
+show_missing = True
+skip_covered = True
diff --git a/backend/__init__.py b/backend/__init__.py
diff --git a/backend/app.py b/backend/app.py
@@ -1,46 +1,70 @@
 import json
 import os
-from flask import Flask, render_template, request
-from flask_cors import CORS
-from helpers.MySQLDatabaseHandler import MySQLDatabaseHandler
 import pandas as pd
+from flask import Flask, render_template, request,jsonify
+from flask_cors import CORS
 
-# ROOT_PATH for linking with all your files. 
-# Feel free to use a config.py or settings.py with a global export variable
-os.environ['ROOT_PATH'] = os.path.abspath(os.path.join("..",os.curdir))
-
-# Get the directory of the current script
-current_directory = os.path.dirname(os.path.abspath(__file__))
-
-# Specify the path to the JSON file relative to the current script
-json_file_path = os.path.join(current_directory, 'init.json')
-
-# Assuming your JSON data is stored in a file named 'init.json'
-with open(json_file_path, 'r') as file:
-    data = json.load(file)
-    episodes_df = pd.DataFrame(data['episodes'])
-    reviews_df = pd.DataFrame(data['reviews'])
+from .processing import Processor
+from .dataset import Dataset
 
 app = Flask(__name__)
 CORS(app)
 
-# Sample search using json with pandas
-def json_search(query):
-    matches = []
-    merged_df = pd.merge(episodes_df, reviews_df, left_on='id', right_on='id', how='inner')
-    matches = merged_df[merged_df['title'].str.lower().str.contains(query.lower())]
-    matches_filtered = matches[['title', 'descr', 'imdb_rating']]
-    matches_filtered_json = matches_filtered.to_json(orient='records')
-    return matches_filtered_json
+processor = Processor()  # one module-level instance, used by the /getbooks and /categories handlers
 
 @app.route("/")
 def home():
     return render_template('base.html',title="sample html")
 
-@app.route("/episodes")
-def episodes_search():
-    text = request.args.get("title")
-    return json_search(text)
+@app.route("/getbooks", methods=["POST"])
+def books_search():
+    """Return the processor's book recommendations for the posted JSON body."""
+    # The parsed request body is handed to the processor unchanged.
+    payload = request.get_json()
+    return jsonify(processor.get_recommended_books(payload))
+
+# @app.route("/titles")
+# def get_title_suggestions():
+#     query = request.args.get("q", "").lower()
+
+#     suggestions = []
+#     for title in processor.books.keys():
+#         if query in title.lower():
+#             suggestions.append(title)
+
+#     return jsonify(suggestions[:10])
+
+# @app.route("/authors")
+# def get_author_suggestions():
+#     query = request.args.get("q", "").lower()
+#     seen = set()
+#     suggestions = []
+
+#     for book_list in processor.books.values():
+#         for book in book_list:
+#             for author in book.get("authors", []):
+#                 author_lower = author.lower()
+#                 if query in author_lower and author_lower not in seen:
+#                     suggestions.append(author)
+#                     seen.add(author_lower)
+
+#     return jsonify(suggestions[:10])
+
+@app.route("/categories")
+def get_category_suggestions():
+    """Return up to five distinct book categories that contain the ``q`` text.
+
+    Matching and de-duplication ignore case; the first spelling seen is kept.
+    """
+    needle = request.args.get("q", "").lower()
+    first_spelling = {}  # lowercased category -> spelling first encountered
+    for shelf in processor.books.values():
+        for entry in shelf:
+            for label in entry.get("categories", []):
+                folded = label.lower()
+                if needle in folded:
+                    first_spelling.setdefault(folded, label)
+    return jsonify(list(first_spelling.values())[:5])
 
 if 'DB_NAME' not in os.environ:
-    app.run(debug=True,host="0.0.0.0",port=5000)
+    app.run(debug=True,host="0.0.0.0",port=5001)  # NOTE(review): debug=True with host 0.0.0.0 exposes the Werkzeug debugger on every interface — local development only
diff --git a/backend/config.py b/backend/config.py
@@ -0,0 +1,4 @@
+import os
+
+ROOT_PATH = os.path.abspath(os.path.dirname(__file__))  # absolute path of the directory holding this module
+DEFAULT_BOOKS_JSON_FILE = os.path.join(ROOT_PATH,'data', 'popular_books.json')  # <ROOT_PATH>/data/popular_books.json
diff --git a/backend/constants.py b/backend/constants.py
@@ -0,0 +1,25 @@
+from types import SimpleNamespace
+
+# Keys of a book record as stored in the database
+CATEGORY_KEY = "categories"
+AUTHOR_KEY = "authors"
+SCORE_KEY = "score"
+DESCRIPTION_KEY = "description"
+
+NOT_AVAILABLE = "NOT AVAILABLE"  # NOTE(review): presumably the placeholder for a missing field — confirm
+
+# Keys of the input payload sent by the frontend
+INPUT_TITLES_KEY = "titles"
+INPUT_AUTHORS_KEY = "authors"
+INPUT_CATEGORIES_KEY = "categories"
+
+DEFAULT_RECS_WEIGHTS = SimpleNamespace(  # the three weights sum to 1.0
+    TITLES =  0.6, 
+    AUTHORS = 0.3, 
+    CATEGORIES =  0.1
+)
+
+DEFAULT_RECS_SIZE = 20  # NOTE(review): presumably how many recommendations to return — confirm
+
+# Processor Constants
+NUM_LATENT_SEMANTIC_CONCEPTS = 100  # NOTE(review): presumably the latent dimension count of the model — confirm