Final_Assignment_Template3

Sleeping

App Files Files Community

bwilkie committed on Aug 9

Commit

8cb575b

verified ·

1 Parent(s): 7d8f8f7

Update multiagents.py

Browse files

Files changed (1) hide show

multiagents.py +52 -20

multiagents.py CHANGED Viewed

@@ -59,32 +59,64 @@ dotenv.load_dotenv()
 grok_api_key = os.getenv("groq_api")
-#InferenceClientModel InferenceClient
-My_Agent = InferenceClientModel(
     provider="groq",
     api_key=grok_api_key,
-    model_id = "qwen/qwen3-32b"
 )
-# test_messages = [{"role": "user", "content": "What are the 3 laws of robotics"}]
-# output_test = My_Agent(test_messages)
-# print('1', output_test)
-# My_Agent = client.chat.completions.create(
-#     model="qewn/qwen3-32b",
-#     messages=[
-#         {
-#             "role": "user",
-#             "content": "How many 'G's in 'huggingface'?"
-#         }
-#     ],
-# )
 def check_final_answer(final_answer, agent_memory)  -> bool:
     """

+# Rate limiting decorator
+def rate_limit(calls_per_minute=15):
+    """Return a decorator that throttles a function to a per-minute call budget.
+
+    Each decorated function keeps its own list of recent call timestamps in
+    the decorator closure. When the trailing 60-second window is already
+    full, the wrapper logs via ``mylog``, sleeps until the oldest call leaves
+    the window, and then forwards the call.
+
+    Args:
+        calls_per_minute: Maximum number of calls allowed in any 60-second
+            window. Must be at least 1.
+
+    Returns:
+        A decorator; the wrapped function returns whatever ``func`` returns.
+
+    Raises:
+        ValueError: If ``calls_per_minute`` is less than 1.
+    """
+    # A non-positive budget can never be satisfied; fail when the decorator is
+    # created instead of with an IndexError on the first call.
+    if calls_per_minute < 1:
+        raise ValueError("calls_per_minute must be at least 1")
+    window = 60  # length of the sliding window, in seconds
+    def decorator(func):
+        call_times = []
+        @wraps(func)
+        def wrapper(*args, **kwargs):
+            # Monotonic clock: interval arithmetic must not be affected by
+            # wall-clock adjustments.
+            now = time.monotonic()
+            # Remove calls older than 1 minute
+            call_times[:] = [t for t in call_times if now - t < window]
+            # Loop rather than check once: if the sleep ends a hair early the
+            # oldest entry may still be inside the window.
+            while len(call_times) >= calls_per_minute:
+                sleep_time = window - (now - call_times[0])
+                if sleep_time > 0:
+                    mylog("rate_limit", f"Rate limit reached. Sleeping for {sleep_time:.2f} seconds")
+                    time.sleep(sleep_time)
+                # Clean up old calls again after sleeping
+                now = time.monotonic()
+                call_times[:] = [t for t in call_times if now - t < window]
+            call_times.append(now)
+            return func(*args, **kwargs)
+        return wrapper
+    return decorator
+# Rate-limited model wrapper
+class RateLimitedModel:
+    """Callable proxy that throttles calls to a wrapped model.
+
+    Calling the instance forwards ``messages`` and keyword arguments to the
+    wrapped model through a ``rate_limit`` wrapper built for this instance.
+    Any attribute not found on the proxy is looked up on the wrapped model.
+
+    Args:
+        model: Callable invoked as ``model(messages, **kwargs)``.
+        calls_per_minute: Call budget per 60-second window for this instance.
+    """
+    def __init__(self, model, calls_per_minute=30):
+        self.model = model
+        self.calls_per_minute = calls_per_minute
+        # Kept so existing readers of this attribute do not break; the
+        # timestamps used for throttling live inside the rate_limit closure.
+        self.call_times = []
+        # Build the limiter per instance: decorating the method at class level
+        # hard-coded the budget and made every instance share one window.
+        self._rate_limited_call = rate_limit(calls_per_minute=calls_per_minute)(self._call_model)
+    def __call__(self, messages, **kwargs):
+        """Invoke the wrapped model, waiting first if the budget is spent."""
+        return self._rate_limited_call(messages, **kwargs)
+    def _call_model(self, messages, **kwargs):
+        """Forward the call to the wrapped model unchanged."""
+        return self.model(messages, **kwargs)
+    def __getattr__(self, name):
+        # Only reached when normal lookup fails. If ``model`` itself is not
+        # set yet (e.g. while the object is being copied or unpickled),
+        # delegating would re-enter this method forever.
+        if name == "model":
+            raise AttributeError(name)
+        # Delegate other attributes to the wrapped model
+        return getattr(self.model, name)
+###################
+# Model setup: the API key is read from the "groq_api" environment variable.
 grok_api_key = os.getenv("groq_api")
+# Base model: qwen/qwen3-32b requested through the "groq" provider.
+base_model = InferenceClientModel(
     provider="groq",
     api_key=grok_api_key,
+    model_id="qwen/qwen3-32b"
 )
+# Wrap with rate limiting (asks the wrapper for a budget of 15 calls per minute).
+My_Agent = RateLimitedModel(base_model, calls_per_minute=15)
 def check_final_answer(final_answer, agent_memory)  -> bool:
     """