Spaces:

valory
/

olas-prediction-leaderboard

Runtime error

richardblythman committed on Apr 17, 2024

Commit

b871994

1 Parent(s): c4e55cd

fix bug

Files changed (2) hide show

app.py CHANGED Viewed

@@ -87,13 +87,6 @@ with demo:
         with gr.TabItem("🚀 Contribute"):
             gr.Markdown(how_to_run)
-        def update_dropdown(tool):
-            if "claude" in tool:
-                return ["claude-3-haiku-20240307", "claude-3-sonnet-20240229", "claude-3-opus-20240229"]
-            else:
-                return ["gpt-3.5-turbo-0125", "gpt-4-0125-preview"]
         # fourth tab - run the benchmark
         with gr.TabItem("🔥 Run the Benchmark"):
             with gr.Row():
@@ -106,14 +99,14 @@ with demo:
                         # "prediction-online-sme",
                         'prediction-request-rag',
                         'prediction-request-reasoning',
-                        "prediction-url-cot-claude",
                         # "prediction-request-rag-cohere",
                         # "prediction-with-research-conservative",
                         # "prediction-with-research-bold",
                     ], label="Tool Name", info="Choose the tool to run")
                 model_name = gr.Dropdown([
                     "gpt-3.5-turbo-0125",
-                    "gpt-4-0125-preview"
                     "claude-3-haiku-20240307",
                     "claude-3-sonnet-20240229",
                     "claude-3-opus-20240229",

         with gr.TabItem("🚀 Contribute"):
             gr.Markdown(how_to_run)
         # fourth tab - run the benchmark
         with gr.TabItem("🔥 Run the Benchmark"):
             with gr.Row():
                         # "prediction-online-sme",
                         'prediction-request-rag',
                         'prediction-request-reasoning',
+                        # "prediction-url-cot-claude",
                         # "prediction-request-rag-cohere",
                         # "prediction-with-research-conservative",
                         # "prediction-with-research-bold",
                     ], label="Tool Name", info="Choose the tool to run")
                 model_name = gr.Dropdown([
                     "gpt-3.5-turbo-0125",
+                    "gpt-4-0125-preview",
                     "claude-3-haiku-20240307",
                     "claude-3-sonnet-20240229",
                     "claude-3-opus-20240229",

tabs/run_benchmark.py CHANGED Viewed

@@ -30,6 +30,10 @@ def run_benchmark_main(tool_name, model_name, num_questions, openai_api_key, ant
     else:
         kwargs["llm_provider"] = "openrouter"
     kwargs["num_urls"] = 3
     kwargs["num_words"] = 300
     kwargs["provide_source_links"] = True

     else:
         kwargs["llm_provider"] = "openrouter"
+    if tool_name == "prediction-request-reasoning" or tool_name == "prediction-request-rag":
+        if not openai_api_key:
+            return f"Error: Tools that use RAG also require an OpenAI API Key"
     kwargs["num_urls"] = 3
     kwargs["num_words"] = 300
     kwargs["provide_source_links"] = True