diff --git a/applications/rag/frontend/container/Dockerfile b/applications/rag/frontend/container/Dockerfile
index a9cd73be4..d7aa7b886 100644
--- a/applications/rag/frontend/container/Dockerfile
+++ b/applications/rag/frontend/container/Dockerfile
@@ -22,6 +22,6 @@ RUN pip install -r requirements.txt
 EXPOSE 8080
 
 ENV FLASK_APP=/workspace/frontend/main.py
-ENV PYTHONPATH=.
+ENV PYTHONPATH=/workspace/frontend/
 # Run the application with Gunicorn
 CMD ["gunicorn", "-w", "4", "-b", "0.0.0.0:8080", "main:app"]
diff --git a/applications/rag/frontend/container/application/utils/cloud_sql_utils.py b/applications/rag/frontend/container/application/utils/cloud_sql_utils.py
index 44a2ca061..009bbcb94 100644
--- a/applications/rag/frontend/container/application/utils/cloud_sql_utils.py
+++ b/applications/rag/frontend/container/application/utils/cloud_sql_utils.py
@@ -22,13 +22,18 @@
 import os
 import logging
 
+import google.cloud.logging as gcloud_logging
+
 from google.cloud.sql.connector import IPTypes
-from langchain_google_cloud_sql_pg import PostgresEngine, PostgresVectorStore
+from langchain_google_cloud_sql_pg import PostgresEngine
 
 logging.basicConfig(
     level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s"
 )
 
+gcloud_logging_client = gcloud_logging.Client()
+gcloud_logging_client.setup_logging()
+
 ENVIRONMENT = os.environ.get("ENVIRONMENT")
@@ -38,7 +43,7 @@
 DB_NAME = os.environ.get("DB_NAME", "pgvector-database")
 
 VECTOR_EMBEDDINGS_TABLE_NAME = os.environ.get("EMBEDDINGS_TABLE_NAME", "")
-CHAT_HISTORY_TABLE_NAME = os.environ.get("CHAT_HISTORY_TABLE_NAME", "chat_history_store")
+CHAT_HISTORY_TABLE_NAME = os.environ.get("CHAT_HISTORY_TABLE_NAME", "message_store")
 
 VECTOR_DIMENSION = os.environ.get("VECTOR_DIMENSION", 384)
@@ -66,13 +71,17 @@ def create_sync_postgres_engine():
         ip_type=IPTypes.PUBLIC if ENVIRONMENT == "development" else IPTypes.PRIVATE,
     )
     try:
-        engine.init_chat_history_table(table_name=CHAT_HISTORY_TABLE_NAME)
         engine.init_vectorstore_table(
             VECTOR_EMBEDDINGS_TABLE_NAME,
             vector_size=VECTOR_DIMENSION,
             overwrite_existing=False,
         )
-    except Exception as e:
-        logging.info(f"Error: {e}")
+    except Exception as err:
+        logging.error(f"Error: {err}")
+
+    try:
+        engine.init_chat_history_table(table_name=CHAT_HISTORY_TABLE_NAME)
+    except Exception as err:
+        logging.error(f"Error: {err}")
 
     return engine
diff --git a/applications/rag/frontend/container/application/vector_storages/cloud_sql.py b/applications/rag/frontend/container/application/vector_storages/cloud_sql.py
index b37724212..603b2ec46 100644
--- a/applications/rag/frontend/container/application/vector_storages/cloud_sql.py
+++ b/applications/rag/frontend/container/application/vector_storages/cloud_sql.py
@@ -65,8 +65,8 @@ def add_texts(
             splits = self.splitter.split_documents(texts)
             ids = [str(uuid.uuid4()) for _ in range(len(splits))]
             self.vector_store.add_documents(splits, ids)
-        except Exception as e:
-            logging.info(f"Error: {e}")
+        except Exception as err:
+            logging.error(f"Error: {err}")
             raise Exception(f"Error adding texts: {err}")
@@ -79,4 +79,5 @@ def similarity_search(
             return docs
         except Exception as err:
+            logging.error(f"Error on similarity search: {err}")
             raise Exception(f"Error on similarity search: {err}")
diff --git a/applications/rag/frontend/container/rag_langchain/rag_chain.py b/applications/rag/frontend/container/rag_langchain/rag_chain.py
deleted file mode 100644
index 807c875c8..000000000
--- a/applications/rag/frontend/container/rag_langchain/rag_chain.py
+++ /dev/null
@@ -1,136 +0,0 @@
-# Copyright 2024 Google LLC
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-import os
-from typing import (Dict)
-from cloud_sql.cloud_sql import CHAT_HISTORY_TABLE_NAME, init_connection_pool, create_sync_postgres_engine, CustomVectorStore
-from google.cloud.sql.connector import Connector
-from langchain_community.llms.huggingface_text_gen_inference import HuggingFaceTextGenInference
-from langchain_community.embeddings.huggingface import HuggingFaceEmbeddings
-from langchain_core.prompts import PromptTemplate
-from langchain_core.runnables import RunnableParallel, RunnableLambda
-from langchain_core.runnables.history import RunnableWithMessageHistory
-from langchain_google_cloud_sql_pg import PostgresChatMessageHistory
-
-QUESTION = "question"
-HISTORY = "history"
-CONTEXT = "context"
-
-INFERENCE_ENDPOINT=os.environ.get('INFERENCE_ENDPOINT', '127.0.0.1:8081')
-SENTENCE_TRANSFORMER_MODEL = 'intfloat/multilingual-e5-small' # Transformer to use for converting text chunks to vector embeddings
-
-
-# TODO use a chat model instead of an LLM in the chain. Convert the prompt to a chat prompt template
-# prompt = ChatPromptTemplate.from_messages(
-#     [
-#         ("system", """You help everyone by answering questions, and improve your answers from previous answers in history.
-# You stick to the facts by basing your answers off of the context provided:"""),
-#         MessagesPlaceholder(variable_name="history"),
-#         MessagesPlaceholder(variable_name="context"),
-#         ("human", "{question}"),
-#     ]
-# )
-template = """Answer the Question given by the user. Keep the answer to no more than 2 sentences.
-Improve upon your previous answers using History, a list of messages.
-Messages of type HumanMessage were asked by the user, and messages of type AIMessage were your previous responses.
-Stick to the facts by basing your answers off of the Context provided.
-Be brief in answering.
-History: {""" + HISTORY + "}\n\nContext: {" + CONTEXT + "}\n\nQuestion: {" + QUESTION + "}\n"
-
-prompt = PromptTemplate(template=template, input_variables=[HISTORY, CONTEXT, QUESTION])
-
-engine = create_sync_postgres_engine()
-# TODO: Dict is not safe for multiprocessing. Introduce a cache using Flask-caching or libcache.
-# The in-memory SimpleCache implementations for each of these libraries are not safe either.
-# Consider redis or memcached (e.g., Memorystore)
-# chat_history_map: Dict[str, PostgresChatMessageHistory] = {}
-
-def get_chat_history(session_id: str) -> PostgresChatMessageHistory:
-    history = PostgresChatMessageHistory.create_sync(
-        engine,
-        session_id=session_id,
-        table_name = CHAT_HISTORY_TABLE_NAME
-    )
-
-    print(f"Retrieving history for session {session_id} with {len(history.messages)} messages")
-    return history
-
-def clear_chat_history(session_id: str):
-    history = PostgresChatMessageHistory.create_sync(
-        engine,
-        session_id=session_id,
-        table_name = CHAT_HISTORY_TABLE_NAME
-    )
-    history.clear()
-
-
-#TODO: limit number of tokens in prompt to MAX_INPUT_LENGTH
-# (as specified in the Hugging Face TGI input parameters)
-
-def create_chain() -> RunnableWithMessageHistory:
-    # TODO HuggingFaceTextGenInference class is deprecated.
-    # The warning is:
-    # The class `langchain_community.llms.huggingface_text_gen_inference.HuggingFaceTextGenInference`
-    # was deprecated in langchain-community 0.0.21 and will be removed in 0.2.0. Use HuggingFaceEndpoint instead.
-    # The replacement is HuggingFaceEndpoint, which requires a Hugging Face
-    # Hub API token. Either need to add the token to the environment, or need to find a method to call TGI
-    # without the token.
-    # Example usage of HuggingFaceEndpoint:
-    # llm = HuggingFaceEndpoint(
-    #     endpoint_url=f'http://{INFERENCE_ENDPOINT}/',
-    #     max_new_tokens=512,
-    #     top_k=10,
-    #     top_p=0.95,
-    #     typical_p=0.95,
-    #     temperature=0.01,
-    #     repetition_penalty=1.03,
-    #     huggingfacehub_api_token="my-api-key"
-    # )
-    # TODO: Give guidance on what these parameters should be and describe why these values were chosen.
-    model = HuggingFaceTextGenInference(
-        inference_server_url=f'http://{INFERENCE_ENDPOINT}/',
-        max_new_tokens=512,
-        top_k=10,
-        top_p=0.95,
-        typical_p=0.95,
-        temperature=0.01,
-        repetition_penalty=1.03,
-    )
-
-    langchain_embed = HuggingFaceEmbeddings(model_name=SENTENCE_TRANSFORMER_MODEL)
-    vector_store = CustomVectorStore(langchain_embed, init_connection_pool(Connector()))
-    retriever = vector_store.as_retriever()
-
-    setup_and_retrieval = RunnableParallel(
-        {
-            "context": retriever,
-            QUESTION: RunnableLambda(lambda d: d[QUESTION]),
-            HISTORY: RunnableLambda(lambda d: d[HISTORY])
-        }
-    )
-    chain = setup_and_retrieval | prompt | model
-    chain_with_history = RunnableWithMessageHistory(
-        chain,
-        get_chat_history,
-        input_messages_key=QUESTION,
-        history_messages_key=HISTORY,
-        output_messages_key="output"
-    )
-    return chain_with_history
-
-def take_chat_turn(chain: RunnableWithMessageHistory, session_id: str, query_text: str) -> str:
-    #TODO limit the number of history messages
-    config = {"configurable": {"session_id": session_id}}
-    result = chain.invoke({"question": query_text}, config)
-    return str(result)
\ No newline at end of file
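
A minimal sketch of what the logging setup added to cloud_sql_utils.py does,
assuming Application Default Credentials are available (on GKE, typically via
Workload Identity): Client.setup_logging() attaches a Cloud Logging handler to
the stdlib root logger, so the logging.error(...) calls in this diff reach
Cloud Logging in addition to the basicConfig stream handler. The message
string below is a placeholder, not part of the change.

    import logging

    import google.cloud.logging as gcloud_logging

    # Stream handler writing to stderr, as configured in the diff.
    logging.basicConfig(
        level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s"
    )

    # Attach the Cloud Logging handler to the root logger. Assumes
    # Application Default Credentials (e.g. Workload Identity on GKE).
    gcloud_logging_client = gcloud_logging.Client()
    gcloud_logging_client.setup_logging()

    # This record now reaches both handlers: stderr and Cloud Logging
    # (by default under the "python" log name).
    logging.error("Error: %s", "example failure")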