Spaces:

vectara
/

menarini-trials

Sleeping

App Files Community

ofermend committed on Apr 12

Commit

b0faf1a

1 Parent(s): 5faad16

updated

Browse files

Files changed (3) hide show

Dockerfile +3 -1
agent.py +45 -1
requirements.txt +1 -1

Dockerfile CHANGED Viewed

@@ -4,7 +4,9 @@ WORKDIR /app
 COPY ./requirements.txt /app/requirements.txt
-RUN pip3 install --no-cache-dir -r /app/requirements.txt
 # User
 RUN useradd -m -u 1000 user

 COPY ./requirements.txt /app/requirements.txt
+RUN pip3 install --no-cache-dir --upgrade pip
+RUN pip3 install --no-cache-dir wheel setuptools build
+RUN pip3 install --no-cache-dir --use-pep517 -r /app/requirements.txt
 # User
 RUN useradd -m -u 1000 user

agent.py CHANGED Viewed

@@ -73,6 +73,50 @@ prompt = """
 ]
 """
 def create_assistant_tools(cfg):
     class QueryPublicationsArgs(BaseModel):
@@ -96,7 +140,7 @@ def create_assistant_tools(cfg):
         reranker = "slingshot", rerank_k = 100, rerank_cutoff = 0.1,
         n_sentences_before = 1, n_sentences_after = 1, lambda_val = 0.1,
         summary_num_results = 15,
-        max_response_chars = 8192, max_tokens = 4096,
         vectara_summarizer = summarizer,
         include_citations = True,
         vectara_prompt_text = prompt,

 ]
 """
+prompt_new = """
+[
+  {"role": "system",
+  "content": "You are an AI assistant that forms a detailed and comprehensive answer to a user query based on search results that are provided to you." },
+  {"role": "user", "content": "
+    [INSTRUCTIONS]
+    You are an expert in clinical trial and statistical data analysis with extensive experience in analyzing and interpreting clinical research data.
+    If the search results are irrelevant to the question respond with *** I do not have enough information to answer this question.***
+    Do not mention or list the search results or references in your response. Never explicitly mention a specific search result.
+    Search results may include tables in a markdown format. When answering a question using a table be careful about which rows and columns contain the answer and include all relevant information from the relevant rows and columns that the query is asking about.
+    Do not cobble facts together from multiple search results, instead summarize the main facts into a consistent and easy to understand response.
+    Do not base your response on information or knowledge that is not in the search results.
+    Make sure your response is answering the query asked. If the query is related to an entity (such as a person or place), make sure you use search results related to that entity.
+    For queries where only a short answer is required, you can give a brief response.
+    Consider that each search result is a partial segment from a bigger text, and may be incomplete.
+    Never refer to the search results in your response.
+    Ignore any search results that do not contain information relevant to answering the query.
+    Your output should always be in a single language - the $vectaraLangName language. Check spelling and grammar for the $vectaraLangName language.
+    Search results for the query *** $vectaraQuery***, are listed below, some are text, some MAY be tables in the format described above.
+    #foreach ($qResult in $vectaraQueryResultsDeduped)
+      [$esc.java($foreach.index + 1)]
+      #if($qResult.hasTable())
+        Table Title: $qResult.getTable().title() || Table Description: $qResult.getTable().description() || Table Data:
+        $qResult.getTable().markdown()
+      #else
+        $qResult.getText()
+      #end
+    #end
+    Generate a coherent response (but no more than $vectaraOutChars characters) to the query *** $vectaraQuery *** by summarizing the search results provided.
+    Give a slight preference to search results that appear earlier in the list.
+    Include statistical and numerical evidence to support and contextualize your response.
+    Your response should include all relevant information and values from the search results. Do not omit anything relevant.
+    Prioritize a long, detailed, thorough and comprehensive response over a short one.
+    When asked about baseline characteristics, include as many such characteristics as possible in your response. Be detailed and comprehensive.
+      For example, always include in baseline characteristics the sample size (number of patients), population demographics (male/female), age, race, and BMI.
+      Include statistical and numerical evidence to support and contextualize your response.
+    If the question is vague or ambiguous, ask for clarification.
+    Your response should include all relevant information and values from the search results. Do not omit anything relevant.
+    Only cite relevant search results in your answer following these specific instructions: $vectaraCitationInstructions
+    If the search results are irrelevant to the query, respond with ***I do not have enough information to answer this question.***. Respond always in the $vectaraLangName language, and only in that language."}
+]
+"""
 def create_assistant_tools(cfg):
     class QueryPublicationsArgs(BaseModel):
         reranker = "slingshot", rerank_k = 100, rerank_cutoff = 0.1,
         n_sentences_before = 1, n_sentences_after = 1, lambda_val = 0.1,
         summary_num_results = 15,
+        max_tokens = 8192,
         vectara_summarizer = summarizer,
         include_citations = True,
         vectara_prompt_text = prompt,

requirements.txt CHANGED Viewed

@@ -5,5 +5,5 @@ streamlit_feedback==0.1.3
 uuid==1.30
 langdetect==1.0.9
 langcodes==3.4.0
-vectara-agentic==0.2.8
 torch==2.6.0

 uuid==1.30
 langdetect==1.0.9
 langcodes==3.4.0
+vectara-agentic==0.2.11
 torch==2.6.0