hi-melnikov committed
Commit 9358ac6 • 1 parent: 8e67ebe
Removing model download to check GUI

Files changed:
- app.py: +7 −13
- src/scripts/update_all_request_files.py: +2 −5
- update_dynamic.py: +2 −0
app.py
CHANGED
@@ -7,7 +7,6 @@ import time
 import gradio as gr
 import pandas as pd
 from apscheduler.schedulers.background import BackgroundScheduler
-from gradio_leaderboard import Leaderboard, SelectColumns
 from gradio_space_ci import enable_space_ci
 from huggingface_hub import snapshot_download
 
@@ -18,11 +17,6 @@ from src.display.about import (
     TITLE,
 )
 from src.display.css_html_js import custom_css
-from src.display.utils import (
-    # BENCHMARK_COLS,
-    AutoEvalColumn,
-    fields,
-)
 from src.envs import (
     API,
     EVAL_RESULTS_PATH,
@@ -87,8 +81,8 @@ def init_space(full_init: bool = True):
     # download_dataset(DYNAMIC_INFO_REPO, DYNAMIC_INFO_PATH)
     download_dataset("Vikhrmodels/openbench-eval", EVAL_RESULTS_PATH)
     # print(subprocess.Popen('ls src'))
-    subprocess.run(['rsync', '-avzP', '--ignore-existing', f'{EVAL_RESULTS_PATH[2:]}/external/*', 'src/gen/data/arena-hard-v0.1/model_answer/'])
-    subprocess.run(['rsync', '-avzP', '--ignore-existing', f'{EVAL_RESULTS_PATH[2:]}/model_judgment/*', 'src/gen/data/arena-hard-v0.1/model_judgement/'])
+    subprocess.run(['rsync', '-avzP', '--ignore-existing', f'{EVAL_RESULTS_PATH[2:]}/external/*', 'src/gen/data/arena-hard-v0.1/model_answer/'], check=False)
+    subprocess.run(['rsync', '-avzP', '--ignore-existing', f'{EVAL_RESULTS_PATH[2:]}/model_judgment/*', 'src/gen/data/arena-hard-v0.1/model_judgement/'], check=False)
     # except Exception:
     #     restart_space()
 
@@ -98,7 +92,6 @@ def init_space(full_init: bool = True):
 
     leaderboard_df = original_df.copy()
 
-
     return leaderboard_df
 
 # Convert the environment variable "LEADERBOARD_FULL_INIT" to a boolean value, defaulting to True if the variable is not set.
@@ -107,7 +100,7 @@ do_full_init = os.getenv("LEADERBOARD_FULL_INIT", "True") == "True"
 
 # Calls the init_space function with the `full_init` parameter determined by the `do_full_init` variable.
 # This initializes various DataFrames used throughout the application, with the level of initialization detail controlled by the `do_full_init` flag.
-leaderboard_df = init_space(full_init=do_full_init)
+# leaderboard_df = init_space(full_init=do_full_init)
 
 demo = gr.Blocks(css=custom_css)
 with demo:
@@ -117,6 +110,7 @@ with demo:
     with gr.Tabs(elem_classes="tab-buttons") as tabs:
         with gr.TabItem("🏅 LLM Benchmark", elem_id="llm-benchmark-tab-table", id=0):
             pass
+            """
             leaderboard = Leaderboard(
                 value=leaderboard_df,
                 datatype=[c.type for c in fields(AutoEvalColumn)],
@@ -135,6 +129,7 @@ with demo:
                 # AutoEvalColumn.license.name
                 ],
             )
+            """
 
 
         with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=3):
@@ -151,9 +146,8 @@ with demo:
         with gr.Column():
            model_name_textbox = gr.Textbox(label="Model name")
            def upload_file(file):
-               print(file.name)
                file_path = file.name.split('/')[-1] if '/' in file.name else file.name
-
+               logging.info("New submition: file saved to %s", file_path)
                API.upload_file(path_or_fileobj=file.name,path_in_repo='./external/'+file_path,repo_id='Vikhrmodels/openbench-eval',repo_type='dataset')
                os.environ[RESET_JUDGEMENT_ENV] = '1'
 
@@ -173,7 +167,7 @@ def update_board():
 
     os.environ[RESET_JUDGEMENT_ENV] = '0'
 
-    subprocess.run(['python','../gen/gen_judgement.py'])
+    subprocess.run(['python','../gen/gen_judgement.py'], check = False)
 
     subprocess.Popen('python3 ../gen/show_result.py --output')
 
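A note on the two rsync calls in init_space(): subprocess.run() is given an argument list, so no shell ever expands the trailing "*", and rsync receives a source path that literally ends in "*"; with check=False the resulting error is silently ignored. Below is a minimal pure-Python sketch of the intended copy. The directory names are taken from the diff; the helper name and the emulation of --ignore-existing are assumptions, not the Space's actual code.

# Sketch only: a glob + shutil equivalent of the rsync calls above.
import glob
import os
import shutil

def sync_results(src_dir: str, dst_dir: str) -> None:
    # Roughly emulates `rsync --ignore-existing src_dir/* dst_dir/`
    # for a flat directory of result files.
    os.makedirs(dst_dir, exist_ok=True)
    for src in glob.glob(os.path.join(src_dir, "*")):
        dst = os.path.join(dst_dir, os.path.basename(src))
        if os.path.isfile(src) and not os.path.exists(dst):
            shutil.copy2(src, dst)

# Called with the same paths the diff uses (EVAL_RESULTS_PATH comes from src.envs):
# sync_results(f"{EVAL_RESULTS_PATH[2:]}/external", "src/gen/data/arena-hard-v0.1/model_answer/")
# sync_results(f"{EVAL_RESULTS_PATH[2:]}/model_judgment", "src/gen/data/arena-hard-v0.1/model_judgement/")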
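The new logging.info line in upload_file assumes the logging module is imported and configured elsewhere in app.py; this hunk does not add it. Here is a sketch of the handler as it reads after the commit, with the pieces the hunk does not show filled in as labelled assumptions (logging setup, a stand-in API client, and a placeholder value for RESET_JUDGEMENT_ENV; the repo details are copied from the diff).

# Sketch, not the Space's exact code.
import logging
import os

from huggingface_hub import HfApi

logging.basicConfig(level=logging.INFO)       # assumption: app.py configures logging somewhere
API = HfApi()                                 # in app.py this comes from src.envs
RESET_JUDGEMENT_ENV = "RESET_JUDGEMENT"       # placeholder name; app.py defines the real constant

def upload_file(file):
    # os.path.basename covers both branches of the inline "split('/')" expression
    file_path = os.path.basename(file.name)
    logging.info("New submission: file saved to %s", file_path)
    API.upload_file(
        path_or_fileobj=file.name,
        path_in_repo="./external/" + file_path,
        repo_id="Vikhrmodels/openbench-eval",
        repo_type="dataset",
    )
    # Flag read back by update_board() further down in app.py
    os.environ[RESET_JUDGEMENT_ENV] = "1"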
src/scripts/update_all_request_files.py
CHANGED
@@ -1,10 +1,8 @@
 import json
 import os
-import
+import subprocess
 
-from
-
-from src.envs import API, DYNAMIC_INFO_FILE_PATH, DYNAMIC_INFO_PATH, DYNAMIC_INFO_REPO, EVAL_REQUESTS_PATH, H4_TOKEN
+from src.envs import EVAL_REQUESTS_PATH, H4_TOKEN
 from src.submission.check_validity import check_model_card, get_model_tags, is_model_on_hub
 
 
@@ -93,7 +91,6 @@ def update_models(file_path, models_on_the_hub):
 
 def update_dynamic_files():
     # from gen import gen_answer,gen_judgment\
-    import subprocess
     subprocess.Popen('python3 ../gen/gen_judgement.py')
 
     subprocess.Popen('python3 ../gen/show_result.py --output')
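update_dynamic_files() now relies on the module-level import subprocess added at the top of the file, but both Popen calls still pass a single string without shell=True, which on Linux is taken as the name of one executable and raises FileNotFoundError instead of launching the script; they are also fire-and-forget. A hedged sketch of a blocking variant using argument lists (the function name is mine; the script paths are copied from the diff and still assume the matching working directory):

# Sketch only: waits for each step and raises on failure.
import subprocess

def update_dynamic_files_blocking():
    subprocess.run(["python3", "../gen/gen_judgement.py"], check=True)
    subprocess.run(["python3", "../gen/show_result.py", "--output"], check=True)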
update_dynamic.py
CHANGED
@@ -1,4 +1,6 @@
 from src.scripts.update_all_request_files import update_dynamic_files
 
 if __name__ == "__main__":
+    print("Updating dynamic files")
+    # Pretty sure this will never be called
     update_dynamic_files()
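For reference, update_dynamic.py after this commit reads in full (reconstructed from the hunk above):

from src.scripts.update_all_request_files import update_dynamic_files

if __name__ == "__main__":
    print("Updating dynamic files")
    # Pretty sure this will never be called
    update_dynamic_files()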