JerryLiJinyi's picture
Upload app.py
8f819b8 verified
raw
history blame
3.1 kB
import os
import subprocess
import sys

import gradio as gr

from compressor import PromptCompressor
# Download the spaCy English model at startup (presumably required by the
# compressor package -- confirm). Use the interpreter that is running this
# app rather than whatever `python` resolves to on PATH, so the model lands
# in the same environment, and pass an argument list so no shell is involved.
_spacy_download = subprocess.run(
    [sys.executable, "-m", "spacy", "download", "en_core_web_sm"],
    stdout=subprocess.PIPE,
    stderr=subprocess.STDOUT,  # keep installer errors in the printed log
    text=True,
    check=False,  # best-effort: a failed download must not stop the app
)
res = _spacy_download.stdout
print(res)
if _spacy_download.returncode != 0:
    print(
        f"spaCy model download exited with status {_spacy_download.returncode}",
        file=sys.stderr,
    )
def compressit(original_text, compressor1, ratio, maxlength):
    """Compress a prompt with the compressor chosen in the demo UI.

    Args:
        original_text: The prompt text to compress.
        compressor1: Compressor name from the dropdown. "SCRL" and "KiS"
            require ``maxlength``; "LLMLingua" and "LongLLMLingua" are
            currently unavailable; anything else (including no selection)
            is handled as "Selective Context".
        ratio: Compression ratio as typed into the ratio textbox.
        maxlength: ``max_length`` as typed into the max_length textbox;
            only read for "SCRL" and "KiS".

    Returns:
        A ``(text, ratio)`` pair, one value per output textbox. On success
        these are the ``"compressed_prompt"`` and ``"ratio"`` entries of the
        compressor result. When the request cannot be served, ``text`` is an
        explanatory message and ``ratio`` is an empty string.
    """
    # Every return below yields two values because the interface declares
    # two output components.
    if compressor1 in ("LLMLingua", "LongLLMLingua"):
        return (
            f"Sorry, currently we cannot provide services for {compressor1} due to the Huggingface Token issue. Please try other compressors.",
            "",
        )

    uses_max_length = compressor1 in ("SCRL", "KiS")

    # Validate the inputs before constructing a compressor, so a bad form
    # value does not cost a model load.
    max_length_value = None
    if uses_max_length:
        if not maxlength:
            gr.Warning("max_length is needed for this type of compressor. Please fill in and try again.")
            return "max_length is missing.", ""
        try:
            max_length_value = int(maxlength)
        except (TypeError, ValueError):
            gr.Warning("max_length must be an integer. Please correct it and try again.")
            return "max_length is invalid.", ""

    try:
        ratio_value = float(ratio)
    except (TypeError, ValueError):
        if not uses_max_length:
            gr.Warning("ratio is needed for this type of compressor. Please fill in a number and try again.")
            return "ratio is missing or invalid.", ""
        # The UI tells SCRL/KiS users that ratio does not apply to them, so a
        # blank field must not fail the request. A placeholder is passed to
        # keep the call shape unchanged.
        # NOTE(review): confirm that SCRL/KiS really ignore `ratio`.
        ratio_value = 0.5

    # Tell the user about the wait before the slow work starts.
    gr.Warning("The prompt is generating, please wait patiently as it may take a long time to generate during busy hours.")

    if compressor1 == "SCRL":
        compressor = PromptCompressor(type='SCRLCompressor', model_dir="models/gigaword-L8/", device="cpu", tokenizer_dir="sentence-transformers/paraphrase-distilroberta-base-v2")
    elif compressor1 == "KiS":
        compressor = PromptCompressor(type='KiSCompressor', device="cpu", model_dir="philippelaban/keep_it_simple")
    else:
        # "Selective Context" and the fallback share the same configuration.
        compressor = PromptCompressor(type='SCCompressor', lang='en', model='gpt2', device='cpu')

    if uses_max_length:
        compressed_prompt = compressor.compressgo(original_prompt=original_text, ratio=ratio_value, max_length=max_length_value)
    else:
        compressed_prompt = compressor.compressgo(original_prompt=original_text, ratio=ratio_value)

    return compressed_prompt["compressed_prompt"], compressed_prompt["ratio"]
# Demo UI: four inputs (prompt, compressor choice, ratio, max_length) are
# passed to `compressit` in that order, and its two return values fill the
# two output textboxes.
demo = gr.Interface(
    fn=compressit,
    inputs=[
        gr.Textbox(lines=2, placeholder="Enter your prompt here...", label="input", info="Enter the original prompt here."),
        gr.Dropdown(
            ["Selective Context", "LLMLingua", "LongLLMLingua", "SCRL", "KiS"], label="compressor", info="Choose your compressor here. \n Currently, we cannot support the online demo for LLMLingua and LongLLMLingua due to the Huggingface Token issue."
        ),
        # Label made explicit so it matches the other inputs.
        gr.Textbox(lines=1, placeholder="Enter the compression ratio here...", label="ratio", info="Ratio only works for Selective Context, LLMLingua and LongLLMLingua."),
        gr.Textbox(lines=1, placeholder="Enter the max_length parameter (integer) if you are using SCRL or KiS", label="max_length", info="If you are using SCRL or KiS, fill in the parameter, if not, just ignore this.\n Hint: For SCRL, max_length should be shorter than the length of original prompt; For KiS, max_length should be longer than it.")
    ],
    outputs=[
        gr.Textbox(lines=1, info="Please wait patiently when proceeding it may take more than 2 minutes to generate since we are using CPUs for free."),
        gr.Textbox(lines=1, info="With the compression ratio of: ")
    ]
)
# Start the web server without requesting a public share link.
demo.launch(share=False)