[CAI-185] Chatbot/docker compose with Redis and DynamoDB for local development (#1193)

* feat(chatbot): session GSI
* feat(chatbot): docker compose
* fix(chatbot): dynamodb and redis for local development with docker compose
* chore(chatbot):remove duplicate imports
* chore(chatbot): linting
* fix(chatbot):create index in docker
* chore(chatbot): llamaindex index id
* fix(chatbot): create vector index with all docs
* chore(chatbot): terraform lint
* fix(chatbot): terraform syntax
* chore(chatbot): remove dynamodb options
* chore(chatbot): from global to local secondary index
* chore: remove old var
* Update apps/chatbot/docker/compose.yaml Co-authored-by: marcobottaro <[email protected]>
* chore: remove logs
* fix(chatbot): compose vars
* Update modules
* Update config prompts
* Update env example
* redis admin port
---------
Co-authored-by: marcobottaro <[email protected]>
Co-authored-by: mdciri <[email protected]>
pagopa · Oct 21, 2024 · 22d370e · 22d370e
1 parent e6b7263
commit 22d370e
Show file tree

Hide file tree

Showing 17 changed files with 1,062 additions and 755 deletions.
diff --git a/apps/chatbot/.env.example b/apps/chatbot/.env.example
@@ -13,6 +13,7 @@ CHB_WEBSITE_URL=...
 CHB_REDIS_INDEX_NAME=...
 CHB_LLAMAINDEX_INDEX_ID=...
 CHB_DOCUMENTATION_DIR=...
+CHB_USE_PRESIDIO=...
 CHB_GOOGLE_API_KEY=...
 CHB_PROVIDER=...
 CHB_MODEL_ID=...
@@ -21,6 +22,7 @@ CHB_MODEL_MAXTOKENS=...
 CHB_EMBED_MODEL_ID=...
 CHB_ENGINE_SIMILARITY_TOPK=...
 CHB_ENGINE_SIMILARITY_CUTOFF=...
-CHB_ENGINE_USE_ASYNC=...
+CHB_ENGINE_USE_ASYNC=True
 CHB_ENGINE_USE_STREAMING=...
 CHB_QUERY_TABLE_PREFIX=chatbot-local
+CHB_DYNAMODB_URL=http://localhost:8000
diff --git a/apps/chatbot/config/prompts.yaml b/apps/chatbot/config/prompts.yaml
@@ -12,7 +12,6 @@ qa_prompt_str: |
     - the answer must be clear, non-redundant, and have not repeated sentences.
     - the answer must not include the query.
     - If your answer is based on this retrieved context, include a "Rif" section at the end of the response, listing the titles and filenames from the source nodes used. If no context is used, do not include a reference.
-    - the answer must be with the same language of the query.
   --------------------
   Output Examples:
     Query: Cos'è il nodo dei pagamenti?
@@ -38,7 +37,14 @@ qa_prompt_str: |
   --------------------
   Task:
     Given the query: {query_str}
-    Answer the query according to the `Chatbot Policy` listed above.
+    
+    Reply to the user following these two steps:
+    Step 1:
+      Pay great attention in detail on the query's language and determine if it is formulated in Italian, English, Spanish, French, German, Greek, Croatian, or Slovenian ('yes' or 'no').
+    Step 2:
+      If Step 1 returns 'yes': reply always in Italian, regardless of the input language, according to the `Chatbot Policy` listed above.
+      Otherwise: reply you cannot speak that language and ask for a new query written in an accepted language.
+
     Answer: 
 
 

diff --git a/apps/chatbot/docker/app.local.Dockerfile b/apps/chatbot/docker/app.local.Dockerfile
@@ -1,6 +1,10 @@
 FROM python:3.12.4-slim-bullseye
 ARG DEBIAN_FRONTEND=noninteractive
 
+RUN apt-get update && \
+  apt-get install -y \
+  curl
+
 ENV PYTHONPATH=/app
 
 RUN pip install --upgrade pip \
@@ -14,4 +18,4 @@ RUN poetry install
 
 COPY . .
 
-CMD ["fastapi", "dev", "src/app/main.py", "--port", "8080"]
+CMD ["fastapi", "dev", "src/app/main.py", "--port", "8080", "--host", "0.0.0.0"]
diff --git a/apps/chatbot/docker/compose.yaml b/apps/chatbot/docker/compose.yaml
@@ -0,0 +1,57 @@
+services:
+  api:
+    build:
+      context: ..
+      dockerfile: docker/app.local.Dockerfile
+    ports:
+      - "8080:8080"
+    volumes:
+      - ..:/app
+      - ./files/.aws:/root/.aws
+      - ../../nextjs-website/out:/app/build-devp/out
+    depends_on:
+      redis:
+        condition: service_started
+      dynamodb:
+        condition: service_started
+    networks:
+      - ntw
+
+  dynamodb:
+    image: amazon/dynamodb-local:2.5.2
+    environment:
+      - AWS_ACCESS_KEY_ID=dummy
+      - AWS_SECRET_ACCESS_KEY=dummy
+      - AWS_DEFAULT_REGION=local
+    ports:
+      - "8000:8000"
+    networks:
+      - ntw
+
+  redis:
+    image: redis/redis-stack:7.2.0-v13
+    ports:
+      - "6379:6379"
+      - "8001:8001"
+    networks:
+      - ntw
+
+  create_index:
+    build:
+      context: ..
+      dockerfile: docker/app.local.Dockerfile
+    ports:
+      - "8080:8080"
+    volumes:
+      - ..:/app
+      - ../../nextjs-website/out:/app/build-devp/out
+    command: "python src/modules/create_vector_index.py --params config/params.yaml"
+    tty: true
+    depends_on:
+      redis:
+        condition: service_started
+    networks:
+      - ntw
+
+networks:
+  ntw:
diff --git a/apps/chatbot/docker/docker-compose-up-api.sh b/apps/chatbot/docker/docker-compose-up-api.sh
@@ -0,0 +1,2 @@
+#!/bin/bash
+docker compose -f docker/compose.yaml -p chatbot up api
diff --git a/apps/chatbot/docker/docker-run-create-index.sh b/apps/chatbot/docker/docker-run-create-index.sh
@@ -0,0 +1,2 @@
+#!/bin/bash
+docker compose -f docker/compose.yaml -p chatbot up create_index
diff --git a/apps/chatbot/docker/docker-run-local-bash.sh b/apps/chatbot/docker/docker-run-local-bash.sh
@@ -0,0 +1,2 @@
+#!/bin/bash
+docker run -it --env-file ./.env fastapi-local bash
diff --git a/apps/chatbot/docker/files/.aws/config b/apps/chatbot/docker/files/.aws/config
@@ -0,0 +1,2 @@
+[profile default]
+region = eu-south-1
diff --git a/apps/chatbot/docker/files/.aws/credentials b/apps/chatbot/docker/files/.aws/credentials
@@ -0,0 +1,3 @@
+[default]
+aws_access_key_id = 123
+aws_secret_access_key = xyz
diff --git a/apps/chatbot/poetry.lock b/apps/chatbot/poetry.lock
diff --git a/apps/chatbot/pyproject.toml b/apps/chatbot/pyproject.toml
@@ -37,9 +37,10 @@ llama-index-llms-gemini = "^0.3.4"
 google-generativeai = "^0.5.2"
 llama-index-embeddings-gemini = "^0.2.0"
 llama-index-llms-bedrock-converse = "^0.3.0"
+chromedriver-py = "^129.0.6668.91"
 llama-index-postprocessor-presidio = "^0.2.0"
 
 
 [build-system]
 requires = ["poetry-core"]
-build-backend = "poetry.core.masonry.api"
+build-backend = "poetry.core.masonry.api"
diff --git a/apps/chatbot/src/app/main.py b/apps/chatbot/src/app/main.py
@@ -18,30 +18,30 @@
 
 params = yaml.safe_load(open("config/params.yaml", "r"))
 prompts = yaml.safe_load(open("config/prompts.yaml", "r"))
-chatbot = Chatbot(params, prompts)
-
 AWS_DEFAULT_REGION = os.getenv('CHB_AWS_DEFAULT_REGION', os.getenv('AWS_DEFAULT_REGION', None))
 
+chatbot = Chatbot(params, prompts)
+
 
 class Query(BaseModel):
   question: str
   queriedAt: str | None = None
 
-if (os.getenv('environment', 'dev') == 'local'):
-  profile_name='dummy'
-  endpoint_url='http://localhost:8000'
-  region_name = AWS_DEFAULT_REGION
-
 boto3_session = boto3.session.Session(
-  profile_name = locals().get('profile_name', None),
-  region_name=locals().get('region_name', None)
+  region_name=AWS_DEFAULT_REGION
 )
 
-dynamodb = boto3_session.resource(    
-  'dynamodb',
-  endpoint_url=locals().get('endpoint_url', None),
-  region_name=locals().get('region_name', None),
-)
+if (os.getenv('environment', 'dev') == 'local'):
+  dynamodb = boto3_session.resource(    
+    'dynamodb',
+    endpoint_url=os.getenv('CHB_DYNAMODB_URL', 'http://localhost:8000'),
+    region_name=AWS_DEFAULT_REGION
+  )
+else:
+  dynamodb = boto3_session.resource(    
+    'dynamodb',
+    region_name=AWS_DEFAULT_REGION
+  )
 
 table_queries = dynamodb.Table(
   f"{os.getenv('CHB_QUERY_TABLE_PREFIX', 'chatbot')}-queries"
@@ -160,12 +160,13 @@ async def sessions_fetching(
     raise HTTPException(status_code=422, detail=f"[sessions_fetching] userId: {userId}, error: {e}")
 
   # TODO: pagination
+  items = db_response.get('Items', [])
   result = {
-    "items": db_response['Items'],
+    "items": items,
     "page": 1,
     "pages": 1,
-    "size": len(db_response['Items']),
-    "total": len(db_response['Items']),
+    "size": len(items),
+    "total": len(items),
   }
   return result
 
@@ -214,20 +215,26 @@ async def queries_fetching(
     sessionId = last_session_id(userId)
 
   try:
-    # TODO: add userId filter
     db_response = table_queries.query(
-      KeyConditionExpression=Key("sessionId").eq(sessionId)
+      KeyConditionExpression=Key("sessionId").eq(sessionId) &
+        Key("id").eq(userId)
     )
   except (BotoCoreError, ClientError) as e:
     raise HTTPException(status_code=422, detail=f"[queries_fetching] sessionId: {sessionId}, error: {e}")
 
-  result = db_response['Items']
+  result = db_response.get('Items', [])
   return result
 
 
 def last_session_id(userId: str):
-  # TODO: retrieve last user session
-  return '1'
+  db_response = table_sessions.query(
+    IndexName='SessionsByCreatedAtIndex',
+    KeyConditionExpression=Key('userId').eq(userId),
+    ScanIndexForward=False,
+    Limit=1
+  )
+  items = db_response.get('Items', [])
+  return items[0] if items else None
 
 @app.patch("/queries/{id}")
 async def query_feedback (badAnswer: bool):

diff --git a/apps/chatbot/src/modules/chatbot.py b/apps/chatbot/src/modules/chatbot.py
@@ -16,10 +16,7 @@
 from src.modules.presidio import PresidioPII
 
 
-AWS_S3_BUCKET = os.getenv("CHB_AWS_S3_BUCKET")
-ITALIAN_THRESHOLD = 0.85
-NUM_MIN_WORDS_QUERY = 3
-NUM_MIN_REFERENCES = 1
+USE_PRESIDIO = True if os.getenv("CHB_USE_PRESIDIO", "True") == "True" else False
 RESPONSE_TYPE = Union[
     Response, StreamingResponse, AsyncStreamingResponse, PydanticResponse
 ]
@@ -36,7 +33,9 @@ def __init__(
 
         self.params = params
         self.prompts = prompts
-        self.pii = PresidioPII(config=params["config_presidio"])
+        if USE_PRESIDIO:
+            self.pii = PresidioPII(config=params["config_presidio"])
+
         self.model = get_llm()
         self.embed_model = get_embed_model()
         self.index = load_automerging_index_redis(
@@ -111,6 +110,9 @@ def _get_response_str(self, engine_response: RESPONSE_TYPE) -> str:
             """
         else:
             response_str = self._unmask_reference(response_str, nodes)
+
+        if "Step 2:" in response_str:
+            response_str = response_str.split("Step 2:")[1].strip()
 
         return response_str
 
@@ -142,7 +144,10 @@ def _unmask_reference(self, response_str: str, nodes) -> str:
 
 
     def mask_pii(self, message: str) -> str:
-        return self.pii.mask_pii(message)
+        if USE_PRESIDIO:
+            return self.pii.mask_pii(message)
+        else:
+            return message
 
 
     def generate(self, query_str: str) -> str:

diff --git a/apps/chatbot/src/modules/presidio.py b/apps/chatbot/src/modules/presidio.py
@@ -12,7 +12,7 @@
 
 
 # see supported entities by Presidio with their description at: https://microsoft.github.io/presidio/supported_entities/
-ENTITIES = [
+GLOBAL_ENTITIES = [
     "CREDIT_CARD",
     "CRYPTO",
     "DATE_TIME",
@@ -23,21 +23,16 @@
     "LOCATION",
     "PERSON",
     "PHONE_NUMBER",
-    "MEDICAL_LICENSE",
+    "MEDICAL_LICENSE"
+]
+
+IT_ENTITIES = [
     "IT_FISCAL_CODE",
     "IT_DRIVER_LICENSE",
     "IT_VAT_CODE",
     "IT_PASSPORT",
     "IT_IDENTITY_CARD",
-    "IT_PHYSICAL_ADDRESS",  # this is a custom entity added to the analyzer registry
-    # "ES_NIF",
-    # "ES_NIE",
-    # "US_BANK_NUMBER",
-    # "US_DRIVER_LICENSE",
-    # "US_ITIN",
-    # "US_PASSPORT",
-    # "US_SSN",
-    # "UK_NHS"
+    "IT_PHYSICAL_ADDRESS"
 ]
 
 ALLOW_LIST = [
@@ -102,9 +97,10 @@ def __init__(
             analyzer_threshold: float = 0.4
         ):
         self.config = config
+        self.languages = [item["lang_code"] for item in config["models"]]
         self.entity_mapping = entity_mapping
         self.mapping = mapping
-        self.entities = entities if entities else ENTITIES
+        self.entities = entities if entities else GLOBAL_ENTITIES
         self.analyzer_threshold = analyzer_threshold
 
         if isinstance(self.config, (Path, str)):
@@ -117,7 +113,7 @@ def __init__(
         self.nlp_engine = nlp_engine
         self.analyzer = AnalyzerEngine(
             nlp_engine = self.nlp_engine,
-            supported_languages = ["it", "en"], # "es", "fr", "de"
+            supported_languages = self.languages,
             default_score_threshold = analyzer_threshold
         )
         self._add_italian_physical_address_entity()
@@ -136,7 +132,7 @@ def detect_language(self, text: str) -> str:
             detected_languages = detect_langs(text)
             lang_list = []
             for detected_lang in detected_languages:
-                if detected_lang.lang in ["it", "en", "es", "fr", "de"]:
+                if detected_lang.lang in self.languages:
                     lang_list.append(detected_lang.lang)
 
             if not lang_list:
@@ -145,7 +141,7 @@ def detect_language(self, text: str) -> str:
             elif "it" in lang_list:
                 lang = "it"
             else:
-                lang = "en" # lang_list[0].lang            
+                lang = lang_list[0]           
         except:
             logging.warning("No detected language.")
             lang = "it"
@@ -160,7 +156,7 @@ def detect_pii(self, text: str) -> List[RecognizerResult]:
         results = self.analyzer.analyze(
             text=text,
             language=lang,
-            entities=self.entities,
+            entities=self.entities + IT_ENTITIES if lang == "it" else self.entities,
             allow_list=ALLOW_LIST
         )
 

diff --git a/apps/chatbot/src/modules/utils.py b/apps/chatbot/src/modules/utils.py
@@ -19,6 +19,7 @@ def get_ssm_parameter(name: str, default: str | None = None) -> str | None:
     :param default: The default value to return if the parameter is not found.
     :return: The value of the requested parameter.
     """
+
     ssm = boto3.client(
         "ssm",
         aws_access_key_id=AWS_ACCESS_KEY_ID,
@@ -37,4 +38,4 @@ def get_ssm_parameter(name: str, default: str | None = None) -> str | None:
         return default
 
     logging.debug(f"Parameter {name} retrieved from SSM")
-    return response["Parameter"]["Value"]
+    return response["Parameter"]["Value"]
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,2 @@
		#!/bin/bash
		docker compose -f docker/compose.yaml -p chatbot up api
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,2 @@
		#!/bin/bash
		docker run -it --env-file ./.env fastapi-local bash