journalism_config_space / pages /4_πŸ” Review Generated Data.py
Ben Burtenshaw
fix push from argilla
9675a52
raw
history blame
1.64 kB
import streamlit as st
from defaults import PROJECT_NAME, ARGILLA_URL, DATASET_REPO_ID
from utils import project_sidebar
from hub import push_argilla_dataset_to_hub
st.set_page_config(
page_title="Domain Data Grower",
page_icon="πŸ§‘β€πŸŒΎ",
)
project_sidebar()
################################################################################
# HEADER
################################################################################
st.header("πŸ§‘β€πŸŒΎ Domain Data Grower")
st.divider()
st.write(
"""Once you have reviewed the synthetic data in Argilla, you can publish the
generated dataset to the Hub."""
)
################################################################################
# Configuration
################################################################################
st.divider()
st.write("πŸ”¬ Argilla API details to push the generated dataset")
argilla_url = st.text_input("Argilla API URL", ARGILLA_URL)
argilla_api_key = st.text_input("Argilla API Key", "owner.apikey")
argilla_dataset_name = st.text_input("Argilla Dataset Name", PROJECT_NAME)
dataset_repo_id = st.text_input("Dataset Repo ID", DATASET_REPO_ID)
st.divider()
if st.button("πŸš€ Publish the generated dataset"):
with st.spinner("Publishing the generated dataset..."):
push_argilla_dataset_to_hub(
name=argilla_dataset_name,
repo_id=dataset_repo_id,
url=argilla_url,
api_key=argilla_api_key,
workspace="admin",
hub_token=st.session_state["hub_token"],
)
st.success("The generated dataset has been published to the Hub.")