Spaces:

AIEnergyScore
/

launch-computation-example

Paused

App Files Community

meg HF staff committed on Oct 7

Commit

0351a9f

•

1 Parent(s): 07f5bdd

Experimenting.

Browse files

Files changed (1) hide show

entrypoint.sh +14 -6

entrypoint.sh CHANGED Viewed

@@ -4,6 +4,7 @@
 set -e
 export SPACE="EnergyStarAI/launch-computation-example"
 echo "Not checking h100 -- already know it's not there."
 #python /check_h100.py
@@ -14,11 +15,15 @@ python /parse_requests.py | while read line; do
     IFS="," read backend_model experiment_name <<< $(echo ${line})
     echo "Benchmarking Model: ${backend_model}, Task: ${experiment_name}"
     now=$(date +%Y-%m-%d-%H-%M-%S)
-    export run_dir="./runs/" #${experiment_name}/${backend_model}/${now}"
-    optimum-benchmark --config-name ${experiment_name}  --config-dir /optimum-benchmark/examples/energy_star/ backend.model=${backend_model} backend.processor=${backend_model} hydra.run.dir=${run_dir} 2> $run_dir/error-${now}.log
 done || {
     echo "Error."
     # TODO: Although this works, `curl` appears to run indefinitely because it is recording itself (the logs are recording the curl operation).
     #echo "Using curl to retrieve the space run log."
     #logs_name=./runs/logs-${now}.txt
@@ -26,14 +31,17 @@ done || {
     #python /failed_run.py --run_dir $run_dir --model_name $backend_model --logs_name $logs_name
 }
-if [ -s $run_dir/error-${now}.log ]; then
     # error.log is non-empty, so an error was raised
     echo "An error was raised while benchmarking the model..."
     python /failed_run.py --run_dir $run_dir --model_name $backend_model
-#    # Delete the current run directory so that it is not pushed by create_results.py later
-#    rm -rf $run_dir
 else
-  # The file is empty, so no error
   echo "Finished; uploading dataset results"
   python /create_results.py ./runs
 fi

 set -e
 export SPACE="EnergyStarAI/launch-computation-example"
+failed=0
 echo "Not checking h100 -- already know it's not there."
 #python /check_h100.py
     IFS="," read backend_model experiment_name <<< $(echo ${line})
     echo "Benchmarking Model: ${backend_model}, Task: ${experiment_name}"
     now=$(date +%Y-%m-%d-%H-%M-%S)
+    export run_dir="./runs/${experiment_name}/${backend_model}/${now}"
+    mkdir -p $run_dir
+    # Let the benchmarking begin!
+    optimum-benchmark --config-name ${experiment_name}  --config-dir /optimum-benchmark/examples/energy_star/ backend.model=${backend_model} backend.processor=${backend_model} hydra.run.dir=${run_dir} 2> $run_dir/error.log
 done || {
     echo "Error."
+    failed=1
     # TODO: Although this works, `curl` appears to run indefinitely because it is recording itself (the logs are recording the curl operation).
     #echo "Using curl to retrieve the space run log."
     #logs_name=./runs/logs-${now}.txt
     #python /failed_run.py --run_dir $run_dir --model_name $backend_model --logs_name $logs_name
 }
+if [ -s $run_dir/error.log ]; then
     # error.log is non-empty, so an error was raised
     echo "An error was raised while benchmarking the model..."
     python /failed_run.py --run_dir $run_dir --model_name $backend_model
+    # TODO: Is this necessary?
+    # Delete the current run directory so that it is not pushed by create_results.py later
+    rm -rf $run_dir
+elif [ "$failed" -eq 1 ]; then
+  echo "Failed, but was not able to retrieve error log."
 else
+  # The error log file is empty, and we didn't catch an error.
   echo "Finished; uploading dataset results"
   python /create_results.py ./runs
 fi