Spaces:

alexandrainst
/

radial-plot-generator

Running

App Files Community

saattrupdan committed on Sep 6

Commit

a27fbcc

1 Parent(s): 376f461

fix: Fetch data from tar.gz file

Browse files

Files changed (1) hide show

app.py +22 -6

app.py CHANGED Viewed

@@ -1,9 +1,11 @@
 """Script to produce radial plots."""
 from functools import partial
 import plotly.graph_objects as go
 import json
 import numpy as np
 from collections import defaultdict
 import pandas as pd
 from pydantic import BaseModel
@@ -782,19 +784,33 @@ def fetch_results() -> dict[Language, pd.DataFrame]:
     Returns:
         A dictionary of languages -> results-dataframes, whose indices are the
         models and columns are the tasks.
     """
     logger.info("Fetching results from EuroEval benchmark...")
     response = requests.get(
         "https://raw.githubusercontent.com/EuroEval/leaderboards/refs/heads/main"
-        "/results/results.jsonl"
     )
     response.raise_for_status()
-    records = [
-        json.loads(dct_str)
-        for dct_str in response.text.split("\n")
-        if dct_str.strip("\n")
-    ]
     # Build a dictionary of languages -> results-dataframes, whose indices are the
     # models and columns are the tasks.

 """Script to produce radial plots."""
 from functools import partial
+import io
 import plotly.graph_objects as go
 import json
 import numpy as np
+import tarfile
 from collections import defaultdict
 import pandas as pd
 from pydantic import BaseModel
     Returns:
         A dictionary of languages -> results-dataframes, whose indices are the
         models and columns are the tasks.
+    Raises:
+        FileNotFoundError:
+            If the results.jsonl file is not found in the tar.gz file.
+        HTTPError:
+            If there is an error fetching the results from GitHub.
     """
     logger.info("Fetching results from EuroEval benchmark...")
+    # Get the tar.gz file containing the results
     response = requests.get(
         "https://raw.githubusercontent.com/EuroEval/leaderboards/refs/heads/main"
+        "/results.tar.gz"
     )
     response.raise_for_status()
+    compressed_file = io.BytesIO(response.content)
+    # Unpack the tar.gz file in memory and read the JSONL file
+    with tarfile.open(fileobj=compressed_file, mode="r:gz") as tar:
+        results_file = tar.extractfile(member="results/results.jsonl")
+        if results_file is None:
+            raise FileNotFoundError(
+                "results/results.jsonl not found in the tar.gz file."
+            )
+        result_lines = results_file.read().decode(encoding="utf-8").splitlines()
+    records = [json.loads(dct_str) for dct_str in result_lines if dct_str.strip("\n")]
     # Build a dictionary of languages -> results-dataframes, whose indices are the
     # models and columns are the tasks.