backend / app.py
meg's picture
meg HF staff
Update app.py
252b09c verified
raw
history blame
2.2 kB
import logging
from src.logging import configure_root_logger
logging.getLogger("httpx").setLevel(logging.WARNING)
logging.getLogger("numexpr").setLevel(logging.WARNING)
logging.getLogger("absl").setLevel(logging.WARNING)
configure_root_logger()
from functools import partial
import gradio as gr
#from main_backend_lighteval import run_auto_eval
from main_backend_harness import run_auto_eval
from src.display.log_visualizer import log_file_to_html_string
from src.display.css_html_js import dark_mode_gradio_js
from src.envs import REFRESH_RATE, REPO_ID, QUEUE_REPO, RESULTS_REPO
from src.logging import setup_logger, log_file
from lm_eval import tasks
logging.basicConfig(level=logging.INFO)
logger = setup_logger(__name__)
print(tasks.__dict__)
intro_md = f"""
# Intro
This is a visual for the auto evaluator.
"""
links_md = f"""
# Important links
| Description | Link |
|-----------------|------|
| Leaderboard | [{REPO_ID}](https://huggingface.co/spaces/{REPO_ID}) |
| Queue Repo | [{QUEUE_REPO}](https://huggingface.co/datasets/{QUEUE_REPO}) |
| Results Repo | [{RESULTS_REPO}](https://huggingface.co/datasets/{RESULTS_REPO}) |
"""
def button_auto_eval():
logger.info("Manually triggering Auto Eval")
run_auto_eval()
reverse_order_checkbox = gr.Checkbox(label="Reverse Order", value=True)
with gr.Blocks(js=dark_mode_gradio_js) as demo:
gr.Markdown(intro_md)
with gr.Tab("Application"):
output_html = gr.HTML(partial(log_file_to_html_string, reverse=reverse_order_checkbox), every=1)
with gr.Row():
download_button = gr.DownloadButton("Download Log File", value=log_file)
with gr.Accordion('Log View Configuration', open=False):
reverse_order_checkbox.render()
# Add a button that when pressed, triggers run_auto_eval
button = gr.Button("Manually Run Evaluation")
gr.Markdown(links_md)
dummy = gr.Markdown(run_auto_eval, every=REFRESH_RATE, visible=False)
button.click(fn=button_auto_eval, inputs=[], outputs=[])
if __name__ == '__main__':
demo.queue(default_concurrency_limit=40).launch(server_name="0.0.0.0", show_error=True, server_port=7860)