Spaces:

gathnex
/

rag-demo

Running

App Files Files Community

gathnex committed on Nov 27, 2023

Commit

e1bc29c

1 Parent(s): 0c611b8

Initial commit

Browse files

Files changed (6) hide show

Dockerfile +14 -0
__init__.py +0 -0
credentials.env +4 -0
main.py +17 -0
rag_retriver.py +49 -0
requirements.txt +7 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,14 @@

+# Base image: official Python 3.9.
+FROM python:3.9
+# All paths below, and the final command, are relative to /code.
+WORKDIR /code
+# Install the Python dependencies before the application sources are copied.
+COPY ./requirements.txt /code/requirements.txt
+RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt
+COPY  ./__init__.py /code/__init__.py
+# NOTE(review): this copies the credentials file into the image. rag_retriver.py
+# loads "credentials.env" by relative path, so it has to sit in the working
+# directory; confirm that real keys are never committed or published with it.
+COPY ./credentials.env /code/credentials.env
+COPY ./rag_retriver.py /code/rag_retriver.py
+COPY ./main.py /code/main.py
+# Serve the FastAPI instance `app` from main.py on all interfaces, port 7860.
+CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]

__init__.py ADDED Viewed

File without changes

credentials.env ADDED Viewed

	@@ -0,0 +1,4 @@

+# Settings read by rag_retriver.py through dotenv_values(); the key names must
+# match the lookups there exactly. The API key and index name values below are
+# placeholders to be replaced before running.
+openai_api = "openai api key"
+Pinecone_api_key = "Pinecone api key"
+Pinecone_environment = "gcp-starter"
+index_name = "index name"

main.py ADDED Viewed

	@@ -0,0 +1,17 @@

+from rag_retriver import Vector_search, GPT_completion_with_vector_search
+from fastapi import FastAPI
+from pydantic import BaseModel
+# Pydantic model for the request body of the RAG endpoint: a JSON object
+# with a single string field, `prompt`.
+class validation(BaseModel):
+    prompt: str  # user question; forwarded to the vector search and to the chat completion
+#Fast API
+app = FastAPI()
+@app.post("/Gathnex_Rag_System")
+async def retrival_augmented_generation(item: validation):
+    rag = Vector_search(item.prompt)
+    completion = GPT_completion_with_vector_search(item.prompt, rag)
+    return completion

rag_retriver.py ADDED Viewed

	@@ -0,0 +1,49 @@

+import pinecone
+from openai import OpenAI
+from dotenv import dotenv_values
+# Load credentials from the dotenv file. The path is relative, so it is
+# presumably looked up in the process working directory (/code in the image).
+env_name = "credentials.env"
+config = dotenv_values(env_name)
+# OpenAI client shared by the embedding and chat-completion calls below.
+client = OpenAI(api_key= config["openai_api"])
+# Name of the Pinecone index to query.
+index_name = config["index_name"]
+# Initialize the connection to Pinecone (get an API key at app.pinecone.io).
+# This has to run before the index handle is created.
+pinecone.init(
+    api_key =  config["Pinecone_api_key"],
+    environment =  config["Pinecone_environment"]
+)
+# Handle to the index, used by Vector_search.
+index = pinecone.Index(index_name)
+#Vector Search
+def Vector_search(query):
+  Rag_data = ""
+  xq = client.embeddings.create(input=query,model="text-embedding-ada-002")
+  res = index.query([xq.data[0].embedding], top_k=2, include_metadata=True)
+  for match in res['matches']:
+      if match['score'] < 0.80:
+        continue
+      Rag_data += match['metadata']['text']
+  return Rag_data
+#GPT Completion
+def GPT_completion_with_vector_search(prompt, rag):
+    DEFAULT_SYSTEM_PROMPT = '''You are a helpful, respectful and honest INTP-T AI Assistant named Gathnex AI. You are talking to a human User.
+    Always answer as helpfully and logically as possible, while being safe. Your answers should not include any harmful, political, religious, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.
+    If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information.
+    You also have access to RAG vectore database access which has Indian Law data. Be careful when giving response, sometime irrelevent Rag content will be there so give response effectivly to user based on the prompt.
+    You can speak fluently in English.
+    Note: Sometimes the Context is not relevant to Question, so give Answer according to that based on sutiation.
+    '''
+    response = client.chat.completions.create(
+    model="gpt-3.5-turbo-1106",
+    messages=[
+        {f"role": "system", "content": DEFAULT_SYSTEM_PROMPT},
+        {f"role": "user", "content": rag +", Prompt: "+ prompt},
+    ]
+    )
+    return response.choices[0].message.content

requirements.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+# rag_retriver.py uses the OpenAI 1.x client (`from openai import OpenAI`).
+openai>=1.0.0
+python-multipart
+fastapi
+pydantic
+uvicorn
+python-dotenv
+# rag_retriver.py calls `pinecone.init(...)`, which pinecone-client 3.0 removed.
+pinecone-client<3.0.0