Spaces: AIEnergyScore/launch-computation-example

Runtime error

App Files Community

meg-huggingface committed on Oct 24, 2024

Commit

258cdcb

1 Parent(s): 9cfc9cd

Rolling back to 8 hours ago

Browse files

Files changed (2) hide show

entrypoint.sh +3 -3
failed_run.py +22 -31

entrypoint.sh CHANGED Viewed

@@ -1,6 +1,6 @@
 #!/bin/bash
-export SPACE="AIEnergyScore/launch-computation-example"
 echo "Not checking h100 -- already know it's not there."
 #python /check_h100.py
@@ -19,7 +19,7 @@ python /parse_requests.py | while read -r line; do
     mkdir -p "$run_dir"
     # Let the benchmarking begin!
-    optimum-benchmark --config-name "${experiment_name}"  --config-dir /optimum-benchmark/examples/energy_star/ backend.model="${backend_model}" backend.processor="${backend_model}" hydra.run.dir="${run_dir}" 2> "${run_dir}/error.log" || (python /failed_run.py --run_dir "${run_dir}" --model_name "${backend_model}" && rm -rf $run_dir)     # If the benchmark fails, update accordingly. Remove the run directory for that specific model.
 done
 echo "Finished; uploading dataset results"
@@ -31,4 +31,4 @@ python /upload_run_folder.py --run_dir "/runs"
 # Pausing space
 echo "Pausing space."
 python /pause_space.py
-echo "Done."

 #!/bin/bash
+export SPACE="EnergyStarAI/launch-computation-example"
 echo "Not checking h100 -- already know it's not there."
 #python /check_h100.py
     mkdir -p "$run_dir"
     # Let the benchmarking begin!
+    optimum-benchmark --config-name "${experiment_name}"  --config-dir /optimum-benchmark/examples/energy_star/ backend.model="${backend_model}" backend.processor="${backend_model}" hydra.run.dir="${run_dir}" 2> "${run_dir}/error.log" || (python /failed_run.py --run_dir "${run_dir}" --model_name "${backend_model}" && rm -rf $run_dir)
 done
 echo "Finished; uploading dataset results"
 # Pausing space
 echo "Pausing space."
 python /pause_space.py
+echo "Done."

failed_run.py CHANGED Viewed

@@ -4,7 +4,6 @@ import os
 from datasets import load_dataset, Dataset
 from huggingface_hub import HfApi
 TOKEN = os.environ.get("DEBUG")
 api = HfApi(token=TOKEN)
@@ -23,39 +22,31 @@ parser.add_argument(
     required=True,
     help="Model to benchmark.",
 )
-parser.add_argument(
-    "--reason",
-    default=None,
-    type=str,
-    required=False,
-    help="Reason for failure -- to update in the requests file",
-)
 args = parser.parse_args()
 # Updating request
-dataset = load_dataset("AIEnergyScore/requests_debug", split="test", token=TOKEN).to_pandas()
-## Set benchmark to failed
-# If we have a custom reason for failure, add that instead of generic FAILED.
-if args.reason:
-    dataset.loc[dataset["model"].isin([args.model_name]), ['status']] = args.reason
-else:
-    # TODO: This doesn't have to be try-except, we could actually check if the file is there...
-    try:
-        # Read error message
-        with open(f"{args.run_dir}/error.log", 'r') as file:
-            for f in file.readlines():
-                if 'Traceback (most recent call last):' in f:
-                    error_message = f
-                    dataset.loc[dataset["model"].isin([args.model_name]), ['status']] = "FAILED"
-                    print("Status set to FAILED")
-                else:
-                    dataset.loc[dataset["model"].isin([args.model_name]), ['status']] = "COMPLETED"
-        # Add a new column for the error message if necessary
-    except FileNotFoundError as e:
-        print(f"Could not find {args.run_dir}/error.log")
 updated_dataset = Dataset.from_pandas(dataset)
-updated_dataset.push_to_hub("AIEnergyScore/requests_debug", split="test", token=TOKEN)

 from datasets import load_dataset, Dataset
 from huggingface_hub import HfApi
 TOKEN = os.environ.get("DEBUG")
 api = HfApi(token=TOKEN)
     required=True,
     help="Model to benchmark.",
 )
 args = parser.parse_args()
 # Updating request
+dataset = load_dataset("EnergyStarAI/requests_debug", split="test",
+                       token=TOKEN).to_pandas()
+# Set benchmark to failed
+# TODO: This doesn't have to be try-except, we could actually check if the file is there.
+try:
+    # Read error message
+    with open(f"{args.run_dir}/error.log", 'r') as file:
+        for f in file.readlines():
+            if 'Traceback (most recent call last):' in f:
+                error_message = f
+                dataset.loc[dataset["model"].isin([args.model_name]), [
+                    'status']] = "FAILED"
+                print("Status set to FAILED")
+            else:
+                dataset.loc[dataset["model"].isin([args.model_name]), [
+                    'status']] = "COMPLETED"
+    # Add a new column for the error message if necessary
+except FileNotFoundError as e:
+    print(f"Could not find {args.run_dir}/error.log")
 updated_dataset = Dataset.from_pandas(dataset)
+updated_dataset.push_to_hub("EnergyStarAI/requests_debug", split="test",
+                            token=TOKEN)