Language models demonstrate powerful capabilities and pose
significant risks. Given their widespread deployment, standardized
@@ -20,12 +27,12 @@ export default function SafetyLanding() {
closed models.
- {/*
Blog Post
- */}
+
Full Leaderboard
diff --git a/helm-frontend/src/components/MediaObjectDisplay.tsx b/helm-frontend/src/components/MediaObjectDisplay.tsx
index 469fcd1bd7..a92b131886 100644
--- a/helm-frontend/src/components/MediaObjectDisplay.tsx
+++ b/helm-frontend/src/components/MediaObjectDisplay.tsx
@@ -21,6 +21,20 @@ export default function MediaObjectDisplay({ mediaObject }: Props) {
);
+ } else if (mediaObject.content_type.includes("audio")) {
+ if (mediaObject.location === undefined) {
+ return null;
+ }
+ const url = getBenchmarkEndpoint(
+ mediaObject.location
+ .replace("benchmark_output/", "")
+ .replace("prod_env/", "../"),
+ );
+ return (
+
+ );
} else {
if (
mediaObject.text &&
diff --git a/helm-frontend/src/components/NavDropdown.tsx b/helm-frontend/src/components/NavDropdown.tsx
index d1b8ae07aa..486edd593e 100644
--- a/helm-frontend/src/components/NavDropdown.tsx
+++ b/helm-frontend/src/components/NavDropdown.tsx
@@ -9,6 +9,22 @@ function NavDropdown() {
ProjectMetadata | undefined
>();
+ useEffect(() => {
+ if (
+ currProjectMetadata &&
+ currProjectMetadata.title &&
+ currProjectMetadata.title !== "All Leaderboards"
+ ) {
+ const titlePrefix =
+ currProjectMetadata.title === "Lite" ||
+ currProjectMetadata.title === "Classic"
+ ? "HELM " + currProjectMetadata.title
+ : currProjectMetadata.title;
+ document.title =
+ titlePrefix + " - Holistic Evaluation of Language Models (HELM)";
+ }
+ }, [currProjectMetadata]);
+
useEffect(() => {
fetch(
"https://raw.githubusercontent.com/stanford-crfm/helm/main/helm-frontend/project_metadata.json",
diff --git a/helm-frontend/src/components/ReleaseDropdown.tsx b/helm-frontend/src/components/ReleaseDropdown.tsx
index 7e648b56ea..6258de2ee3 100644
--- a/helm-frontend/src/components/ReleaseDropdown.tsx
+++ b/helm-frontend/src/components/ReleaseDropdown.tsx
@@ -1,3 +1,4 @@
+import { Badge } from "@tremor/react";
import { useEffect, useState } from "react";
import getReleaseSummary from "@/services/getReleaseSummary";
import ReleaseSummary from "@/types/ReleaseSummary";
@@ -40,13 +41,6 @@ function ReleaseDropdown() {
});
}, []);
- function getReleases(): string[] {
- return currProjectMetadata !== undefined &&
- currProjectMetadata.releases !== undefined
- ? currProjectMetadata.releases
- : ["v1.0.0"];
- }
-
useEffect(() => {
const controller = new AbortController();
async function fetchData() {
@@ -58,20 +52,34 @@ function ReleaseDropdown() {
return () => controller.abort();
}, []);
- const releases = getReleases();
+ const releases =
+ currProjectMetadata !== undefined &&
+ currProjectMetadata.releases !== undefined
+ ? currProjectMetadata.releases
+ : ["v1.0.0"];
- if (!summary.release && !summary.suite) {
+ const currentVersion = summary.release || summary.suite || null;
+
+ if (!currentVersion) {
return null;
}
- const releaseInfo = `Release ${summary.release || summary.suite} (${
- summary.date
- })`;
+ const releaseInfo = `Release ${currentVersion} (${summary.date})`;
if (releases.length <= 1) {
return
;
}
+ const indexOfCurrentVersion = releases.indexOf(currentVersion);
+
+ const badge =
+ indexOfCurrentVersion < 0 ? (
+