Update agent.py
agent.py CHANGED
@@ -124,38 +124,25 @@ All answers are graded by exact string match, so format carefully!"""
     def __call__(self, prompt: str, **kwargs) -> str:
         """
         Call the model with appropriate handling of system prompts for Anthropic
-
-        Args:
-            prompt: The prompt to send to the model
-            **kwargs: Additional arguments to pass to LiteLLM
-
-        Returns:
-            The model's response as a string
         """
         # Wait according to rate limiter
         RATE_LIMITER.wait()
 
         try:
-            #
-            # We do this by using the 'messages' parameter directly with the system content
-
-            # Extract system_instruction from kwargs if it exists and remove it
-            # (to avoid the "Extra inputs are not permitted" error)
+            # Remove system_instruction if present in kwargs
             if 'system_instruction' in kwargs:
-                # We'll ignore it and use our stored system prompt instead
                 del kwargs['system_instruction']
 
-            #
-            messages = [
-                {"role": "system", "content": self.system_prompt},
-                {"role": "user", "content": prompt}
-            ]
-
-            # Call LiteLLM with the proper message format for Anthropic
+            # For Anthropic via LiteLLM, use the direct completion method
            from litellm import completion
+
+            # Create a simple prompt with system instructions at the beginning
+            # This avoids the nested message structure issue
+            complete_prompt = f"{self.system_prompt}\n\n{prompt}"
+
             response = completion(
                 model=self.model_id,
-                messages=messages,
+                messages=[{"role": "user", "content": complete_prompt}],
                 api_key=self.api_key,
                 temperature=self.temperature,
                 max_tokens=self.max_tokens,
@@ -166,15 +153,13 @@ All answers are graded by exact string match, so format carefully!"""
             return response.choices[0].message.content
 
         except Exception as e:
+            # Handle rate limit errors
             if "rate_limit" in str(e).lower():
-                # Specific handling for rate limit errors
                 print(f"Rate limit error: {e}")
                 print("Waiting 60 seconds before retrying...")
                 time.sleep(60)
-                # Recursive retry after waiting
                 return self.__call__(prompt, **kwargs)
             else:
-                # Re-raise other errors
                 print(f"Error calling Anthropic API: {e}")
                 raise
 
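The substance of the change: instead of sending the system prompt as a separate {"role": "system", ...} message, the new code prepends it to the user prompt and sends everything as a single user message. A minimal standalone sketch of the new call shape, assuming litellm is installed and ANTHROPIC_API_KEY is set in the environment; the model id and prompts below are placeholders, not values from this repo:

from litellm import completion

# Placeholder values -- the class in agent.py reads these from self.*
MODEL_ID = "anthropic/claude-3-opus-20240229"  # hypothetical model id
SYSTEM_PROMPT = "All answers are graded by exact string match, so format carefully!"
USER_PROMPT = "What is the capital of France? Answer with a single word."

# Fold the system prompt into one user message, as the new code does.
complete_prompt = f"{SYSTEM_PROMPT}\n\n{USER_PROMPT}"

response = completion(
    model=MODEL_ID,
    messages=[{"role": "user", "content": complete_prompt}],
    temperature=0.0,
    max_tokens=256,
)
print(response.choices[0].message.content)

Flattening gives up the separate system slot that Anthropic's API provides, but it sidesteps the message-structure error this commit describes, and the call site only ever has to build one messages list.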
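RATE_LIMITER.wait() guards every request, but its definition sits outside this hunk. For illustration only, here is a minimal fixed-interval limiter that would satisfy this call site; the RateLimiter class and the one-request-per-interval policy are assumptions, not the repo's actual implementation:

import threading
import time

class RateLimiter:
    """Minimal fixed-interval limiter: at most one call per min_interval seconds."""

    def __init__(self, min_interval: float = 1.0):
        self.min_interval = min_interval
        self._lock = threading.Lock()
        self._last_call = 0.0

    def wait(self) -> None:
        # Block until at least min_interval has passed since the previous call.
        with self._lock:
            now = time.monotonic()
            remaining = self._last_call + self.min_interval - now
            if remaining > 0:
                time.sleep(remaining)
            self._last_call = time.monotonic()

RATE_LIMITER = RateLimiter(min_interval=1.0)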
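One thing the diff leaves unchanged: the rate-limit branch retries by calling self.__call__ recursively after a fixed 60-second wait, so a persistently throttled key retries forever and deepens the stack on every attempt. A bounded-retry variant with exponential backoff, sketched as a hypothetical standalone helper rather than as part of this commit:

import time

def call_with_retries(call, prompt, max_retries: int = 5, base_delay: float = 60.0):
    """Bounded retry wrapper around a model call.

    A variant of the recursive retry in the diff: caps the number of
    attempts so a persistent rate limit cannot retry indefinitely.
    `call` is any callable that takes a prompt and returns a string.
    """
    for attempt in range(max_retries):
        try:
            return call(prompt)
        except Exception as e:
            # Re-raise non-rate-limit errors and the final failed attempt.
            if "rate_limit" not in str(e).lower() or attempt == max_retries - 1:
                raise
            delay = base_delay * (2 ** attempt)  # exponential backoff
            print(f"Rate limit hit (attempt {attempt + 1}/{max_retries}); "
                  f"sleeping {delay:.0f}s")
            time.sleep(delay)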