ai_chatbot 0.1.6.4 → 0.1.6.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 802b2da58aa8ef78b7b9813faf48e789db953d4c6e62a437002b1dc6017e4167
-  data.tar.gz: b3525c33bd0965aeccc2b13d67380e67df0ec6f3c502b0afe24968d694833d0f
+  metadata.gz: fee6347bdac6070db1bfbc1711f039103c1237c149f42a7f0b848b85eba98314
+  data.tar.gz: c54c29b235f159921d4b33ac36bc56d505983eb03a25500829d72e9741628983
 SHA512:
-  metadata.gz: eff5b8d9885206a83a4f6a05ca275c925717299360ae62df2af451009a07e5d244de503031d0f8a091a4cd1ef067af85a18cadf6ded9ef994899b6d5639e4747
-  data.tar.gz: b05cd753b9e3d4db2d9e6fb86aa43b2e0e355d8cf723e3d852bfb43a23897aade4d5849232179c7338babc0f19568d05d5c5eafdda781337d00daca83b6594fc
+  metadata.gz: f80cec458575b77b6be9879007e3f60830886b88bcfbde28974e9fe1e68b59d61424956a0aea0db62e69e5705e2c8d2b2b97d3e6700ee3b9cdd141530816325f
+  data.tar.gz: d2ac4f47ef9ce02255a60e84a6bff019c9036be5368f79e43748ca945a459c4459c5b53ee7a57a8345114018e03d0f5a1eeab70895ac78bafefed6980223dc59
@@ -1,5 +1,5 @@
 # frozen_string_literal: true
 
 module AiChatbot
-  VERSION = "0.1.6.4"
+  VERSION = "0.1.6.5.1"
 end
data/lib/ml_model.py CHANGED
@@ -1,162 +1,142 @@
 import sys
+import psycopg2
+import os
+from dotenv import load_dotenv
 from sklearn.feature_extraction.text import TfidfVectorizer
 from sklearn.naive_bayes import MultinomialNB
 from sklearn.pipeline import make_pipeline
 from sklearn.metrics.pairwise import cosine_similarity
-import pickle
-import os
 
-# Cache to store previously asked questions
-cache = {}
-
-# Load or initialize the dataset
-if os.path.exists("qa_model.pkl"):
-    with open("qa_model.pkl", "rb") as f:
-        model_data = pickle.load(f)
-        questions = model_data.get("questions", [])
-        answers = model_data.get("answers", [])
-else:
-    questions = [
-        "How to create a new model in Rails?",
-        "What is migration?",
-        "How to add a route?"
-    ]
-    answers = [
-        "You can create a model using 'rails generate model'.",
-        "Migration is a database schema change.",
-        "You can add a route in the config/routes.rb file."
-    ]
-
-# Create a pipeline (TF-IDF + MultinomialNB)
-model = make_pipeline(TfidfVectorizer(), MultinomialNB())
-model.fit(questions, answers)
-
-# Populate cache with known questions and answers
-for q, a in zip(questions, answers):
-    cache[q.lower()] = a
-
-# Function to predict or retrain the model
-def main(action, query=None, new_answer=None):
-    if action == "predict":
-        return get_prediction(query)
-    elif action == "train_model":
-        return train_model(query, new_answer)
-    elif action == "update_answer":
-        return update_answer(query, new_answer)
-    elif action == "update_or_delete_question":
-        return update_or_delete_question(query, new_answer)
-    elif action == "list_questions":
-        return list_questions()
-    elif action == "list_answers":
-        return list_answers()
+# Load environment variables
+load_dotenv()
 
-# Function to predict the response with caching
-def get_prediction(query):
-    query_lower = query.lower()
+# Connect to PostgreSQL
+conn = psycopg2.connect(
+    dbname=os.getenv("DB_NAME"),
+    user=os.getenv("DB_USERNAME"),
+    password=os.getenv("DB_PASSWORD"),
+    host=os.getenv("DB_HOST"),
+    port=os.getenv("DB_PORT"),
+)
+cursor = conn.cursor()
+
+# Fetch data from DB
+cursor.execute("SELECT question, answer FROM qa_data")
+rows = cursor.fetchall()
+questions = [row[0] for row in rows]
+answers = [row[1] for row in rows]
 
-    # **Check cache first**
-    if query_lower in cache:
-        return cache[query_lower]
+# Define the vectorizer and Naive Bayes model
+vectorizer = TfidfVectorizer()
+model = MultinomialNB()
+pipeline = make_pipeline(vectorizer, model)
 
-    query_vec = model.named_steps['tfidfvectorizer'].transform([query])
-    question_vecs = model.named_steps['tfidfvectorizer'].transform(questions)
+# Train model if there is data
+if questions:
+    pipeline.fit(questions, answers)
 
-    # Calculate cosine similarity
-    similarities = cosine_similarity(query_vec, question_vecs)
-    max_similarity = similarities.max()
+
+def get_prediction(query):
+    if not questions:
+        return "No questions available in the database."
+
+    query_vec = vectorizer.transform([query])
+    similarities = cosine_similarity(query_vec, vectorizer.transform(questions)).flatten()
+
+    max_sim_index = similarities.argmax()
+    max_similarity = similarities[max_sim_index]
 
     threshold = 0.65
     if max_similarity < threshold:
         return "No good match found. Please provide the correct answer."
     else:
-        prediction = model.predict([query])[0]
-
-        # **Store in cache for faster future retrieval**
-        cache[query_lower] = prediction
-
-        return prediction
-
-# Function to train the model with a new question and answer
+        return answers[max_sim_index]
+
+
+# Function to train the model with new data
 def train_model(new_question, new_answer):
     global questions, answers
 
-    # Append new question-answer pair
+    # Store in database
+    cursor.execute(
+        "INSERT INTO qa_data (question, answer, created_at, updated_at) VALUES (%s, %s, NOW(), NOW()) ON CONFLICT (question) DO NOTHING",
+        (new_question, new_answer),
+    )
+    conn.commit()
+
+    # Update lists and retrain model
     questions.append(new_question)
     answers.append(new_answer)
+    pipeline.fit(questions, answers)  # Retrain model
 
-    # Retrain the model
-    model.fit(questions, answers)
-
-    # **Update cache**
-    cache[new_question.lower()] = new_answer
+    return f"Added: '{new_question}' -> '{new_answer}'"
 
-    # Save the updated model
-    with open("qa_model.pkl", "wb") as f:
-        pickle.dump({"questions": questions, "answers": answers}, f)
-
-    return f"Model retrained with: '{new_question}' -> '{new_answer}'"
 
 # Function to update an answer
 def update_answer(existing_question, new_answer):
-    global questions, answers
-
-    if existing_question in questions:
-        index = questions.index(existing_question)
-        answers[index] = new_answer
-
-        # Retrain the model
-        model.fit(questions, answers)
+    if existing_question not in questions:
+        return f"Question '{existing_question}' not found."
 
-        # **Update cache**
-        cache[existing_question.lower()] = new_answer
+    cursor.execute(
+        "UPDATE qa_data SET answer = %s WHERE question = %s", (new_answer, existing_question)
+    )
+    conn.commit()
 
-        # Save the model
-        with open("qa_model.pkl", "wb") as f:
-            pickle.dump({"questions": questions, "answers": answers}, f)
-
-        return f"Answer updated for: '{existing_question}'"
-
-    return "Question not found."
-
-# Function to update or delete a question
-def update_or_delete_question(existing_question, new_question):
-    global questions, answers
+    # Update lists and retrain model
+    index = questions.index(existing_question)
+    answers[index] = new_answer
+    pipeline.fit(questions, answers)
 
-    if existing_question in questions:
-        index = questions.index(existing_question)
+    return f"Updated: '{existing_question}' -> '{new_answer}'"
 
-        if new_question:
-            questions[index] = new_question
-            # **Update cache**
-            cache[new_question.lower()] = answers[index]
-        else:
-            # Delete the question
-            del questions[index]
-            del answers[index]
 
-        # Retrain the model
-        model.fit(questions, answers)
+# Function to delete a question
+def delete_question(existing_question):
+    if existing_question not in questions:
+        return f"Question '{existing_question}' not found."
 
-        # **Remove from cache if deleted**
-        if not new_question:
-            cache.pop(existing_question.lower(), None)
+    cursor.execute("DELETE FROM qa_data WHERE question = %s", (existing_question,))
+    conn.commit()
 
-        # Save the model
-        with open("qa_model.pkl", "wb") as f:
-            pickle.dump({"questions": questions, "answers": answers}, f)
+    index = questions.index(existing_question)
+    del questions[index]
+    del answers[index]
+    pipeline.fit(questions, answers)
 
-        return f"Updated question: '{existing_question}' -> '{new_question}'" if new_question else f"Deleted: '{existing_question}'"
+    return f"Deleted: '{existing_question}'"
 
-    return "Question not found."
 
+# Function to list questions
 def list_questions():
-    return questions
+    cursor.execute("SELECT question FROM qa_data")
+    return [row[0] for row in cursor.fetchall()]
+
 
+# Function to list answers
 def list_answers():
-    return answers
+    cursor.execute("SELECT answer FROM qa_data")
+    return [row[0] for row in cursor.fetchall()]
 
+
+# Command-line execution
 if __name__ == "__main__":
     action = sys.argv[1]
     question = sys.argv[2] if len(sys.argv) > 2 else None
     answer = sys.argv[3] if len(sys.argv) > 3 else None
-    print(main(action, question, answer))
+
+    if action == "predict":
+        print(get_prediction(question))
+    elif action == "train_model":
+        print(train_model(question, answer))
+    elif action == "update_answer":
+        print(update_answer(question, answer))
+    elif action == "delete_question":
+        print(delete_question(question))
+    elif action == "list_questions":
+        print(list_questions())
+    elif action == "list_answers":
+        print(list_answers())
+
+    # Close DB connection
+    cursor.close()
+    conn.close()
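
Note: the rewritten ml_model.py assumes a qa_data table already exists and that connection settings come from a .env file (DB_NAME, DB_USERNAME, DB_PASSWORD, DB_HOST, DB_PORT). No schema ships with the gem, so the sketch below is an assumption inferred from the SQL in the diff: the ON CONFLICT (question) DO NOTHING clause requires a unique constraint on question, and the INSERT names created_at/updated_at columns.

# Hypothetical setup sketch -- the qa_data schema is not part of this release;
# it is inferred from the INSERT/UPDATE/DELETE statements in data/lib/ml_model.py.
import os

import psycopg2
from dotenv import load_dotenv

load_dotenv()  # expects DB_NAME, DB_USERNAME, DB_PASSWORD, DB_HOST, DB_PORT

conn = psycopg2.connect(
    dbname=os.getenv("DB_NAME"),
    user=os.getenv("DB_USERNAME"),
    password=os.getenv("DB_PASSWORD"),
    host=os.getenv("DB_HOST"),
    port=os.getenv("DB_PORT"),
)

with conn, conn.cursor() as cur:
    # "ON CONFLICT (question) DO NOTHING" implies a unique constraint on
    # question; created_at/updated_at match the columns named in the INSERT.
    cur.execute(
        """
        CREATE TABLE IF NOT EXISTS qa_data (
            id         SERIAL PRIMARY KEY,
            question   TEXT NOT NULL UNIQUE,
            answer     TEXT NOT NULL,
            created_at TIMESTAMP NOT NULL DEFAULT NOW(),
            updated_at TIMESTAMP NOT NULL DEFAULT NOW()
        )
        """
    )

conn.close()

Seeding the table with the three Rails questions that the 0.1.6.4 script hard-coded would reproduce the previous default behaviour, since get_prediction now answers only from rows in qa_data.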
metadata CHANGED
@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: ai_chatbot
 version: !ruby/object:Gem::Version
-  version: 0.1.6.4
+  version: 0.1.6.5.1
 platform: ruby
 authors:
 - Sanket
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2025-02-26 00:00:00.000000000 Z
+date: 2025-03-05 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: open3
@@ -24,8 +24,8 @@ dependencies:
     - - ">="
       - !ruby/object:Gem::Version
         version: '0'
-description: Integrates a chatbot using Python for predictions and training in a Rails
-  application.
+description: Added PostgreSQL support, fixed model error. Version 0.1.6.5.1 Details
+  on Git.
 email:
 - sanket.tikhande@gmail.com
 executables: []
@@ -58,5 +58,5 @@ requirements: []
 rubygems_version: 3.3.7
 signing_key:
 specification_version: 4
-summary: 'Fix: Improved response caching in ChatbotService'
+summary: 'Fix: Added postgres integration'
 test_files: []
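
The gemspec still depends on open3, so the Ruby side presumably shells out to the Python script. As a rough illustration of the command-line dispatch added at the bottom of ml_model.py (the script path and a working Postgres/.env setup are assumptions, not part of this diff), a caller could drive the new actions like this:

# Hedged illustration of the CLI defined in ml_model.py's __main__ block.
# The relative path "lib/ml_model.py" is hypothetical; the action names
# mirror the dispatch shown in the diff above.
import subprocess


def run_action(action, *args):
    # argv[1] is the action, argv[2]/argv[3] the optional question and answer,
    # matching the sys.argv handling in ml_model.py.
    result = subprocess.run(
        ["python3", "lib/ml_model.py", action, *args],
        capture_output=True,
        text=True,
        check=True,
    )
    return result.stdout.strip()


print(run_action("train_model", "What is a migration?", "A database schema change."))
print(run_action("predict", "What is a migration?"))
print(run_action("list_questions"))

Because each invocation reloads questions and answers from qa_data, state now persists across processes through PostgreSQL rather than the qa_model.pkl pickle file used in 0.1.6.4.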