
Commit 0ac7f3d

Mirko Ortensi authored and committed
first commit
1 parent 7618505 · commit 0ac7f3d


57 files changed, +12225 -1 lines changed

Dockerfile

Lines changed: 12 additions & 0 deletions
@@ -0,0 +1,12 @@
FROM docker.io/python:3.9
WORKDIR /app
COPY src /app/src/
COPY requirements.txt wsgi.py /app/

RUN pip install --no-cache-dir -r requirements.txt

ENV GUNICORN_CMD_ARGS="--workers 1 --bind 0.0.0.0:8000 --timeout 600 --log-level debug --capture-output --error-logfile ./gunicorn.log"
ENV PYTHONUNBUFFERED=1
EXPOSE 8000

CMD [ "gunicorn", "wsgi:create_app()" ]
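The `CMD` hands gunicorn the application factory `wsgi:create_app()`. The actual `wsgi.py` is part of the commit but not rendered in this excerpt; the following is only a hedged sketch of what such a factory might look like, assuming a standard Flask application-factory layout and the flask_restx `Api` declared in `src/apis/__init__.py` below.

```python
# Hypothetical sketch of wsgi.py (the real file is not shown here). It assumes
# the flask_restx Api object defined in src/apis/__init__.py in this commit.
from flask import Flask


def create_app():
    app = Flask(__name__)
    from src.apis import api  # flask_restx Api instance declared in this commit
    api.init_app(app)         # mounts the REST API under its '/api' prefix
    return app


if __name__ == "__main__":
    # Local development fallback; in the container, gunicorn calls create_app().
    create_app().run(host="0.0.0.0", port=8000)
```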

README.md

Lines changed: 51 additions & 1 deletion
@@ -1 +1,51 @@
# MiniPilot

This application implements a chatbot that you can train with your own data. The example provided is a movie recommender system.

![demo](src/static/images/minipilot.gif)

The system uses:

- Redis Stack as a vector database to store the dataset, vectorize the entries, and perform [Vector Similarity Search (VSS)](https://redis.io/docs/latest/develop/interact/search-and-query/advanced-concepts/vectors/) for RAG (a minimal query sketch follows this list)
- The [IMDB movies dataset](https://www.kaggle.com/datasets/ashpalsingh1525/imdb-movies-dataset), which contains 10,000+ movies
- The OpenAI ChatGPT Large Language Model (LLM) [ChatCompletion API](https://platform.openai.com/docs/guides/gpt/chat-completions-api)
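
For illustration only (this snippet is not part of the commit), here is a minimal redis-py sketch of the kind of KNN query that VSS runs over the indexed movies. The field name `content_vector` is LangChain's default Redis vector field, and the index name is a placeholder for the timestamped index created by `initialize.py`; both are assumptions.

```python
import numpy as np
import redis
from langchain_community.embeddings import OpenAIEmbeddings
from redis.commands.search.query import Query

# Embed the query text with the same embedding model used at indexing time.
query_vector = np.array(OpenAIEmbeddings().embed_query("a space adventure movie"),
                        dtype=np.float32)

# KNN query against the vector field; "content_vector" is LangChain's default
# field name and the index name below is a placeholder (assumptions, see above).
knn = (
    Query("*=>[KNN 3 @content_vector $vec AS vector_score]")
    .sort_by("vector_score")
    .return_fields("names", "vector_score")
    .dialect(2)
)
conn = redis.Redis(host="127.0.0.1", port=6379)
results = conn.ft("minipilot_rag_2024_01_01_00_00_00_idx").search(
    knn, query_params={"vec": query_vector.tobytes()})
for doc in results.docs:
    print(doc.names, doc.vector_score)
```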

## Setup

Clone the repository:

```commandline
git clone https://github.com/mortensi/MiniPilot.git
```

Make sure you have an [OpenAI token](https://openai.com/api/pricing/), then install the requirements:

```commandline
pip install -r requirements.txt
```

Then set the environment variables in a `.env` file.

```commandline
DB_SERVICE="127.0.0.1"
DB_PORT=6379
DB_PWD=""

MINIPILOT_DEBUG="True"
MINIPILOT_MODEL="gpt-3.5-turbo-16k"

OPENAI_API_KEY="your-openai-key"
```

You can also use the `export` command.

```commandline
export DB_SERVICE="127.0.0.1" DB_PORT=6379 DB_PWD="" MINIPILOT_DEBUG="True" MINIPILOT_MODEL="gpt-3.5-turbo-16k" OPENAI_API_KEY="your-openai-key"
```
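
These variables are read with `os.getenv` at runtime (see `initialize.py` below). As a hedged illustration, not code from this commit, they could be loaded from the `.env` file with python-dotenv, which is pinned in `requirements.txt`:

```python
import os

from dotenv import load_dotenv

# Sketch only: load the .env file described above, falling back to the same
# defaults that initialize.py uses for the Redis connection settings.
load_dotenv()

redis_host = os.getenv("DB_SERVICE", "127.0.0.1")
redis_port = int(os.getenv("DB_PORT", 6379))
redis_password = os.getenv("DB_PWD", "")
model_name = os.getenv("MINIPILOT_MODEL", "gpt-3.5-turbo-16k")
debug = os.getenv("MINIPILOT_DEBUG", "False") == "True"
openai_api_key = os.environ["OPENAI_API_KEY"]  # required, no default
```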

Start the server with `./start.sh`.

Load the data with `python3 initialize.py`.

Point your browser to `http://127.0.0.1:5005/` and start asking questions.

imdb_movies.csv

Lines changed: 10179 additions & 0 deletions
Large diffs are not rendered by default.

initialize.py

Lines changed: 91 additions & 0 deletions
@@ -0,0 +1,91 @@
import csv
import os
from datetime import datetime
import logging

import redis
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain_community.embeddings import OpenAIEmbeddings
from langchain_community.vectorstores.redis import Redis


def generate_redis_connection_string():
    if os.getenv('DB_PWD', ''):
        connection_string = f"redis://:{os.getenv('DB_PWD', '')}@{os.getenv('DB_SERVICE', '127.0.0.1')}:{int(os.getenv('DB_PORT', 6379))}"
    else:
        connection_string = f"redis://{os.getenv('DB_SERVICE', '127.0.0.1')}:{int(os.getenv('DB_PORT', 6379))}"

    return connection_string


def load():
    conn = redis.from_url(generate_redis_connection_string())

    # Create a new, timestamped index
    index_name = f"minipilot_rag_{datetime.now().strftime('%Y_%m_%d_%H_%M_%S')}_idx"

    index_schema = {
        "tag": [{"name": "genre"},
                {"name": "country"}],
        "text": [{"name": "names"}],
        "numeric": [{"name": "revenue"},
                    {"name": "score"},
                    {"name": "date_x"}]
    }

    vector_schema = {
        "algorithm": "HNSW"
    }

    # If no index exists for RAG yet, this is the first one: the alias must be pointed to it manually once indexing is done
    try:
        conn.ft('convai_rag_alias').info()
    except redis.exceptions.ResponseError:
        logging.warning("No alias exists for semantic search. Create the alias when indexing is done")

    # Validate that an OPENAI_API_KEY is available in the environment
    try:
        embedding_model = OpenAIEmbeddings()
    except Exception as e:
        logging.error(e)
        return

    doc_splitter = RecursiveCharacterTextSplitter(chunk_size=10000,
                                                  chunk_overlap=50,
                                                  length_function=len,
                                                  add_start_index=True)

    with open("imdb_movies.csv", encoding='utf-8') as csvf:
        csvReader = csv.DictReader(csvf)
        cnt = 0
        for row in csvReader:
            movie = f"movie title is: {row['names']}\n"
            movie += f"movie genre is: {row['genre']}\n"
            movie += f"movie crew is: {row['crew']}\n"
            movie += f"movie score is: {row['score']}\n"
            movie += f"movie overview is: {row['overview']}\n"
            movie += f"movie country is: {row['country']}\n"
            movie += f"movie revenue is: {row['revenue']}\n"

            cnt += 1
            splits = doc_splitter.split_text(row['overview'])
            unix_timestamp = int(datetime.strptime(row['date_x'].strip(), "%m/%d/%Y").timestamp())
            metadatas = {"names": row['names'],
                         "genre": row['genre'],
                         "country": row['country'],
                         "revenue": row['revenue'],
                         "score": row['score'],
                         "date_x": unix_timestamp}

            if len(splits) > 0:
                Redis.from_texts(texts=splits,
                                 metadatas=[metadatas] * len(splits),
                                 embedding=embedding_model,
                                 index_name=index_name,
                                 index_schema=index_schema,
                                 vector_schema=vector_schema,
                                 redis_url=generate_redis_connection_string())

load()
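
The script only warns that the alias has to be created once indexing is done. As an illustrative assumption (not code from this commit), redis-py's `FT.ALIASUPDATE` wrapper can point the alias checked above at the index that `load()` just built:

```python
import redis

# Hedged sketch: reuse generate_redis_connection_string() from initialize.py
# and point the search alias at the freshly built, timestamped index. The
# index name below is a placeholder for the one created by load().
conn = redis.from_url(generate_redis_connection_string())
conn.ft("minipilot_rag_2024_01_01_00_00_00_idx").aliasupdate("convai_rag_alias")
```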

requirements.txt

Lines changed: 24 additions & 0 deletions
@@ -0,0 +1,24 @@
beautifulsoup4==4.12.3
Flask==3.0.1
flask_cors==4.0.0
flask_paginate==2023.10.24
flask-restx==1.3.0
flask_session==0.6.0
gunicorn==21.2.0
langchain==0.1.4
langchain_community==0.0.16
langchain_core==0.1.17
openai==1.10.0
python-dotenv==1.0.1
redis==5.0.1
redisvl==0.0.7
Requests==2.31.0
scrapy==2.11.0
spacy==3.7.4
spacy-legacy==3.0.12
tiktoken==0.5.2
WTForms==3.1.2
wtforms_json==0.3.5
sentence-transformers==2.3.0
tenacity==8.2.2
validators==0.22.0

src/.DS_Store

6 KB
Binary file not shown.

src/__init__.py

Whitespace-only changes.

src/_version.py

Lines changed: 1 addition & 0 deletions
@@ -0,0 +1 @@
__version__ = "0.9.0"

src/apis/__init__.py

Lines changed: 23 additions & 0 deletions
@@ -0,0 +1,23 @@
from flask_restx import Api

from .service import api as ns_service

authorizations = {
    'api_key': {
        'type': 'apiKey',
        'in': 'header',
        'name': 'admin-token'
    }
}

api = Api(
    title='Minipilot Server REST API',
    version='1.0',
    description='Welcome to the Minipilot Server REST API. Use this API to train your GenAI chatbot with online docs',
    doc='/api',
    prefix='/api',
    authorizations=authorizations,
    security='api_key'
)

api.add_namespace(ns_service)
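
The `authorizations` block declares an `api_key` scheme carried in an `admin-token` request header, and `security='api_key'` makes it the default scheme in the Swagger UI served at `/api`. A hedged sketch of supplying that header from a client follows; the base URL, port, and token value are illustrative assumptions.

```python
import requests

# Illustrative only: the 'admin-token' header name comes from the
# authorizations dict above; the URL, port, and token value are placeholders.
headers = {"admin-token": "your-admin-token", "session-id": "demo-session"}
resp = requests.get("http://127.0.0.1:5005/api/history", headers=headers)
print(resp.status_code, resp.json())
```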

src/apis/service.py

Lines changed: 100 additions & 0 deletions
@@ -0,0 +1,100 @@
import urllib

from flask import request, jsonify, Response
from flask_paginate import Pagination
from flask_restx import Resource, Namespace, reqparse, inputs
from langchain_community.chat_message_histories import RedisChatMessageHistory
from redis.commands.search.query import Query

from src.apis.validation import rate_limiter
from src.common.config import MINIPILOT_SEARCH_RESULTS, REDIS_CFG, MINIPILOT_HISTORY_TIMEOUT
from src.common.utils import get_db, parse_query_string, extract_keywords, generate_redis_connection_string, \
    history_to_json
from src.core.RedisRetrievalChain import RedisRetrievalChain

api = Namespace('Services', path="/", description='Chat and search services')


def min_length(min_len):
    def validate(s):
        if len(s) < min_len:
            raise ValueError(f'Minimum length is {min_len}')
        return s
    return validate


def validate_length(min_len, max_len):
    def validate(s):
        if len(s) < min_len:
            raise ValueError(f'Minimum length is {min_len}')
        if len(s) > max_len:
            raise ValueError(f'Maximum length is {max_len}')
        return s
    return validate


@api.route('/history')
class ChatHistory(Resource):
    @api.doc(params={'session-id': {'in': 'header', 'description': 'session-id'}})
    @api.doc(description='Get user conversation history', consumes=['application/json'])
    def get(self):
        """Get user conversation history"""
        session_id = str(request.headers.get("session-id"))
        redis_history = RedisChatMessageHistory(url=generate_redis_connection_string(REDIS_CFG["host"], REDIS_CFG["port"], REDIS_CFG["password"]),
                                                session_id=session_id,
                                                key_prefix='minipilot:history:',
                                                ttl=MINIPILOT_HISTORY_TIMEOUT)
        return history_to_json(redis_history.messages), 200


@api.route('/reset')
class ChatHistoryReset(Resource):
    @api.doc(params={'session-id': {'in': 'header', 'description': 'session-id'}})
    @api.doc(description='Reset user conversation history', consumes=['application/json'])
    def post(self):
        """Reset user conversation history"""
        session_id = str(request.headers.get("session-id"))
        engine = RedisRetrievalChain(session_id)
        engine.reset_history()
        return {"response": "Conversation restarted"}, 200


@api.route('/chat')
class Chat(Resource):
    service_query_parser = reqparse.RequestParser()
    service_query_parser.add_argument('q', type=validate_length(4, 500), required=True, help='Chat query', location='args')

    @api.expect(service_query_parser)
    @api.doc(params={'session-id': {'in': 'header', 'description': 'session-id'}})
    @rate_limiter(request)
    @api.doc(description='Ask a question in natural language: will answer, post the answer to the history and semantic cache', consumes=['application/json'])
    def post(self):
        """Ask a question in natural language: will answer, post the answer to the history and semantic cache"""
        args = self.service_query_parser.parse_args(req=request)
        session_id = str(request.headers.get("session-id"))

        engine = RedisRetrievalChain(session_id)
        engine.ask(args['q'])
        return Response(engine.streamer(), content_type="text/event-stream", headers={'X-Accel-Buffering': 'no'})


@api.route('/references')
class SearchReferences(Resource):
    service_query_parser = reqparse.RequestParser()
    service_query_parser.add_argument('q', type=str, required=True, help='References query', location='args')

    @api.expect(service_query_parser)
    @api.doc(description='Semantic references from a natural language query', consumes=['application/json'])
    def get(self):
        """Semantic references from a natural language query"""
        args = self.service_query_parser.parse_args(req=request)
        # This method is session-less and just performs a vector search; we reuse the RedisRetrievalChain utility
        # with a placeholder session id. TODO: clean up and use a new session-less constructor, or RedisVL
        session_id = "xxxxxxx"
        engine = RedisRetrievalChain(session_id)
        references = engine.references(urllib.parse.unquote(args['q']))
        return references, 200
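
Putting the pieces together, here is a hedged end-to-end example of calling the streaming `/chat` endpoint. This client is not part of the commit; the port follows the README's development setup on 5005 (8000 applies when running the Dockerfile's gunicorn command), and the base URL is an assumption.

```python
import requests

# Illustrative client for the POST /api/chat endpoint defined above. The query
# parameter 'q' and the 'session-id' header match the service.py definitions;
# the base URL and port are assumptions.
resp = requests.post(
    "http://127.0.0.1:5005/api/chat",
    params={"q": "Recommend a science fiction movie about space travel"},
    headers={"session-id": "demo-session"},
    stream=True,  # the endpoint returns a text/event-stream response
)
for line in resp.iter_lines():
    if line:
        print(line.decode())
```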
