Update about

src/about.py (+8 -2)
@@ -19,7 +19,13 @@ Models are evaluated on their ability to properly refuse harmful requests and de
 across multiple categories and test scenarios.
 """
 
-LLM_BENCHMARKS_TEXT = ""
+LLM_BENCHMARKS_TEXT = """
+CircleGuardBench is the first-of-its-kind benchmark for evaluating the protection capabilities of large language model (LLM) guard systems.
+
+It tests how well guard models block harmful content, resist jailbreaks, avoid false positives, and operate efficiently in real-time environments on a taxonomy close to real-world data.
+
+Learn more about us at whitecircle.ai
+"""
 
 
 EVALUATION_QUEUE_TEXT = """

@@ -39,7 +45,7 @@ CITATION_BUTTON_LABEL = "Cite CircleGuardBench"
 CITATION_BUTTON_TEXT = """
 @misc{circleguardbench2025,
   author = {whitecircle-ai},
-  title = {CircleGuardBench: Comprehensive Benchmark for LLM Safety Guardrails},
+  title = {CircleGuardBench: Comprehensive Benchmark for LLM Safety Guardrails. Learn more about us at whitecircle.ai},
   year = {2025},
   publisher = {GitHub},
   journal = {GitHub repository},