Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
model changed to Haiku 3.5 for query rewrite
Browse files
semantic_search/query_rewrite.py
CHANGED
|
@@ -235,18 +235,18 @@ def get_new_query_res(query):
|
|
| 235 |
if(query == ""):
|
| 236 |
query = st.session_state.input_rekog_label
|
| 237 |
if(st.session_state.input_is_rewrite_query == 'enabled'):
|
| 238 |
-
|
| 239 |
get_prompt = prompt_.format(query=query,schema = schema)
|
| 240 |
-
print(f"prompt latency: {time.time() - start:.2f} sec")
|
| 241 |
-
start = time.time()
|
| 242 |
res = invoke_models.invoke_llm_model( get_prompt,False)
|
| 243 |
-
print(f"Claude latency: {time.time() - start:.2f} sec")
|
| 244 |
inter_query = res[7:-3].replace('\\"',"'").replace("\n","")
|
| 245 |
-
start = time.time()
|
| 246 |
query_struct = StructuredQueryOutputParser.from_components().parse(inter_query)
|
| 247 |
opts = OpenSearchTranslator()
|
| 248 |
result_query_llm = opts.visit_structured_query(query_struct)[1]['filter']
|
| 249 |
-
print(f"Langchain latency: {time.time() - start:.2f} sec")
|
| 250 |
draft_new_query = {'bool':{'should':[],'must':[]}}
|
| 251 |
if('bool' in result_query_llm and ('must' in result_query_llm['bool'] or 'should' in result_query_llm['bool'])):
|
| 252 |
#draft_new_query['bool']['should'] = []
|
|
|
|
| 235 |
if(query == ""):
|
| 236 |
query = st.session_state.input_rekog_label
|
| 237 |
if(st.session_state.input_is_rewrite_query == 'enabled'):
|
| 238 |
+
#start = time.time()
|
| 239 |
get_prompt = prompt_.format(query=query,schema = schema)
|
| 240 |
+
#print(f"prompt latency: {time.time() - start:.2f} sec")
|
| 241 |
+
#start = time.time()
|
| 242 |
res = invoke_models.invoke_llm_model( get_prompt,False)
|
| 243 |
+
#print(f"Claude latency: {time.time() - start:.2f} sec")
|
| 244 |
inter_query = res[7:-3].replace('\\"',"'").replace("\n","")
|
| 245 |
+
#start = time.time()
|
| 246 |
query_struct = StructuredQueryOutputParser.from_components().parse(inter_query)
|
| 247 |
opts = OpenSearchTranslator()
|
| 248 |
result_query_llm = opts.visit_structured_query(query_struct)[1]['filter']
|
| 249 |
+
#print(f"Langchain latency: {time.time() - start:.2f} sec")
|
| 250 |
draft_new_query = {'bool':{'should':[],'must':[]}}
|
| 251 |
if('bool' in result_query_llm and ('must' in result_query_llm['bool'] or 'should' in result_query_llm['bool'])):
|
| 252 |
#draft_new_query['bool']['should'] = []
|
utilities/invoke_models.py
CHANGED
|
@@ -108,7 +108,7 @@ def read_from_table(file,question):
|
|
| 108 |
|
| 109 |
model = BedrockChat(
|
| 110 |
client=bedrock_runtime_client,
|
| 111 |
-
model_id="anthropic.claude-3-haiku-20240307-v1:0",
|
| 112 |
model_kwargs=bedrock_params,
|
| 113 |
streaming=False
|
| 114 |
)
|
|
@@ -130,7 +130,7 @@ def generate_image_captions_llm(base64_string,question):
|
|
| 130 |
|
| 131 |
|
| 132 |
response = bedrock_runtime_client.invoke_model(
|
| 133 |
-
modelId= "anthropic.claude-3-haiku-20240307-v1:0",
|
| 134 |
contentType = "application/json",
|
| 135 |
accept = "application/json",
|
| 136 |
|
|
|
|
| 108 |
|
| 109 |
model = BedrockChat(
|
| 110 |
client=bedrock_runtime_client,
|
| 111 |
+
model_id="anthropic.claude-3-5-haiku-20241022-v1:0",
|
| 112 |
model_kwargs=bedrock_params,
|
| 113 |
streaming=False
|
| 114 |
)
|
|
|
|
| 130 |
|
| 131 |
|
| 132 |
response = bedrock_runtime_client.invoke_model(
|
| 133 |
+
modelId= "anthropic.claude-3-5-haiku-20241022-v1:0",
|
| 134 |
contentType = "application/json",
|
| 135 |
accept = "application/json",
|
| 136 |
|