Update app.py

app.py CHANGED
@@ -12,10 +12,10 @@ TITLE = """
|
|
12 |
<p><em>Once a pod has started, you can safely close this tab. The results are then privately uploaded to <a href="https://gist.github.com/">GitHub Gist</a>, and the pod is automatically destroyed.</em></p>
|
13 |
"""
|
14 |
|
15 |
-
def autoeval(BENCHMARK,
|
16 |
runpod.api_key = RUNPOD_TOKEN
|
17 |
pod = runpod.create_pod(
|
18 |
-
name=f"Eval {
|
19 |
image_name="runpod/pytorch:2.0.1-py3.10-cuda11.8.0-devel-ubuntu22.04",
|
20 |
gpu_type_id=GPU,
|
21 |
cloud_type=CLOUD_TYPE,
|
@@ -25,7 +25,7 @@ def autoeval(BENCHMARK, MODEL, GPU, NUMBER_OF_GPUS, CONTAINER_DISK, CLOUD_TYPE,
         template_id="au6nz6emhk",
         env={
             "BENCHMARK": BENCHMARK,
-            "MODEL_ID": MODEL,
+            "MODEL_ID": MODEL_ID,
             "REPO": REPO,
             "TRUST_REMOTE_CODE": TRUST_REMOTE_CODE,
             "DEBUG": DEBUG,
@@ -42,7 +42,7 @@ with gr.Blocks() as demo:
         gr.Textbox("", label="Model", value="mlabonne/NeuralBeagle14-7B", info="ID of the model you want to evaluate", placeholder="mlabonne/NeuralBeagle14-7B"),
         gr.Dropdown(GPU_LIST, label="GPU", value="NVIDIA GeForce RTX 3090", info="Select your GPU to run the evaluation"),
         gr.Slider(minimum=1, maximum=8, value=1, step=1, label="Number of GPUs", info="Number of GPUs to use"),
-        gr.Slider(minimum=50, maximum=500, value=
+        gr.Slider(minimum=50, maximum=500, value=75, step=25, label="Container disk", info="Size of the container disk in GB"),
         gr.Dropdown(["COMMUNITY", "SECURE"], value="COMMUNITY", label="Cloud type", info="Select your cloud type"),
         gr.Textbox("https://github.com/mlabonne/llm-autoeval.git", label="LLM AutoEval repo", info="Link to your LLM AutoEval repo"),
         gr.Checkbox(label="Trust remote code", value=False, info="Required for some models like phi-2"),
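
For reference, a minimal sketch of calling the updated autoeval() signature directly, bypassing the Gradio UI. The import path, the "nous" benchmark string, and the environment-variable token handling are assumptions for illustration; the values below simply mirror the widget defaults shown in this diff.

import os

from app import autoeval  # assumed import path for this Space's app.py

# Illustrative values mirroring the UI defaults above; tokens come from
# your own environment, and "nous" is an assumed benchmark identifier.
autoeval(
    BENCHMARK="nous",
    MODEL_ID="mlabonne/NeuralBeagle14-7B",
    GPU="NVIDIA GeForce RTX 3090",
    NUMBER_OF_GPUS=1,
    CONTAINER_DISK=75,   # new default introduced by this commit
    CLOUD_TYPE="COMMUNITY",
    REPO="https://github.com/mlabonne/llm-autoeval.git",
    TRUST_REMOTE_CODE=False,
    DEBUG=False,
    GITHUB_API_TOKEN=os.environ["GITHUB_API_TOKEN"],
    RUNPOD_TOKEN=os.environ["RUNPOD_TOKEN"],
)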