File size: 2,247 Bytes
08ae6c5
95c19d6
 
 
 
 
 
 
2a5f9fb
8b88d2c
a49910a
5ea4d55
 
8b88d2c
 
95c19d6
 
252b09c
8c49cb6
8b88d2c
95c19d6
2a73469
252b09c
1ffc326
8b88d2c
 
95c19d6
 
 
 
 
af9288c
95c19d6
 
 
 
 
8b88d2c
d084b26
95c19d6
 
 
 
 
 
 
8b88d2c
95c19d6
8b88d2c
95c19d6
 
 
 
 
 
 
 
 
6bc96ff
8c49cb6
95c19d6
 
 
8b88d2c
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# Logging is set up first, ahead of the remaining imports below.
# NOTE(review): presumably so that anything logged while those modules are
# imported already goes through the configured root logger — confirm.
import logging
from src.logging import configure_root_logger
# Raise these third-party loggers to WARNING so their INFO/DEBUG records are dropped.
logging.getLogger("httpx").setLevel(logging.WARNING)
logging.getLogger("numexpr").setLevel(logging.WARNING)
logging.getLogger("absl").setLevel(logging.WARNING)
configure_root_logger()

from functools import partial

import gradio as gr
#from main_backend_lighteval import run_auto_eval
#from main_backend_harness import run_auto_eval
from main_backend_toxicity import run_auto_eval
from src.display.log_visualizer import log_file_to_html_string
from src.display.css_html_js import dark_mode_gradio_js
from src.envs import REFRESH_RATE, REPO_ID, QUEUE_REPO, RESULTS_REPO
from src.logging import setup_logger, log_file
from lm_eval import tasks

# Fallback root configuration. logging.basicConfig() does nothing when the
# root logger already has handlers.
# NOTE(review): configure_root_logger() runs earlier in this file; whether it
# installs root handlers (making this call a no-op) is not visible here.
logging.basicConfig(level=logging.INFO)
logger = setup_logger(__name__)

# Startup diagnostic: dump the namespace of the imported lm_eval.tasks module.
# Emitted at DEBUG through the module logger (lazy %-formatting) instead of an
# unconditional print(), so it no longer floods stdout on every start and the
# large dict is only rendered when DEBUG logging is enabled.
logger.debug("lm_eval.tasks namespace: %s", tasks.__dict__)

# Markdown shown at the top of the page. A plain (non-f) string: there are no
# placeholders to interpolate. The space after "evaluator." is kept so the
# runtime value is unchanged.
intro_md = (
    "\n"
    "# Intro\n"
    "This is a visual for the auto evaluator. \n"
)

# Markdown table of links to the Hub repos named by REPO_ID, QUEUE_REPO and
# RESULTS_REPO. Assembled one source line per rendered line.
links_md = (
    "\n"
    "# Important links\n"
    "\n"
    "| Description     | Link |\n"
    "|-----------------|------|\n"
    f"| Leaderboard     | [{REPO_ID}](https://huggingface.co/spaces/{REPO_ID}) |\n"
    f"| Queue Repo      | [{QUEUE_REPO}](https://huggingface.co/datasets/{QUEUE_REPO}) |\n"
    f"| Results Repo    | [{RESULTS_REPO}](https://huggingface.co/datasets/{RESULTS_REPO}) |\n"
)

def button_auto_eval() -> None:
    """Log that a manual run was requested, then call ``run_auto_eval``.

    Used as the click handler of the "Manually Run Evaluation" button; it
    takes no inputs and its return value is not used by the UI.
    """
    logger.info("Manually triggering Auto Eval")
    run_auto_eval()


# The checkbox is created outside the Blocks context so it can be referenced
# when building the log view below; it is placed in the layout later via
# .render() inside the accordion.
reverse_order_checkbox = gr.Checkbox(label="Reverse Order", value=True)

# Page layout: intro text, then a single "Application" tab holding the log
# view, log download / view options, the manual trigger button and the links.
with gr.Blocks(js=dark_mode_gradio_js) as demo:
    gr.Markdown(intro_md)
    with gr.Tab("Application"):
        # Log view: the value is a callable with every=1, so it is refreshed
        # on that interval (seconds, per Gradio's `every` parameter).
        # NOTE(review): partial() binds `reverse` to the Checkbox *component
        # object*, not to its current value. Unless log_file_to_html_string or
        # Gradio resolves the component, the argument is always truthy and the
        # checkbox has no effect — confirm.
        output_html = gr.HTML(partial(log_file_to_html_string, reverse=reverse_order_checkbox), every=1)
        with gr.Row():
            download_button = gr.DownloadButton("Download Log File", value=log_file)
            with gr.Accordion('Log View Configuration', open=False):
                # Attach the checkbox created above at this position in the layout.
                reverse_order_checkbox.render()
        # Button that triggers run_auto_eval on demand (wired up at the end of this block).
        button = gr.Button("Manually Run Evaluation")
        gr.Markdown(links_md)

        # Hidden component whose value callable is run_auto_eval: acts as a
        # periodic trigger, re-running the evaluation every REFRESH_RATE
        # (presumably seconds — verify in src.envs). Its rendered value is never shown.
        dummy = gr.Markdown(run_auto_eval, every=REFRESH_RATE, visible=False)

        # Manual trigger: no inputs are read and no components are updated.
        button.click(fn=button_auto_eval, inputs=[], outputs=[])


if __name__ == '__main__':
    # Enable the event queue (default concurrency limit of 40 per event),
    # then serve on all interfaces at port 7860 with errors shown in the UI.
    queued_demo = demo.queue(default_concurrency_limit=40)
    queued_demo.launch(
        server_name="0.0.0.0",
        show_error=True,
        server_port=7860,
    )