gchhablani commited on
Commit
d74c94a
·
1 Parent(s): c84beda

Add other generation parameters

Browse files
Files changed (1) hide show
  1. app.py +7 -4
app.py CHANGED
@@ -44,11 +44,11 @@ code_to_name = {
44
  }
45
 
46
  @st.cache
47
- def generate_sequence(pixel_values, lang_code, num_beams, temperature, top_p):
48
  lang_code = language_mapping[lang_code]
49
- output_ids = state.model.generate(input_ids=pixel_values, forced_bos_token_id=tokenizer.lang_code_to_id[lang_code], max_length=64, num_beams=num_beams, temperature=temperature, top_p = top_p)
50
  print(output_ids)
51
- output_sequence = tokenizer.batch_decode(output_ids[0], skip_special_tokens=True, max_length=64)
52
  return output_sequence
53
 
54
  def read_markdown(path, parent="./sections/"):
@@ -72,6 +72,9 @@ st.write(
72
  )
73
 
74
  st.sidebar.title("Generation Parameters")
 
 
 
75
  num_beams = st.sidebar.number_input(label="Number of Beams", min_value=2, max_value=10, value=4, step=1, help="Number of beams to be used in beam search.")
76
  temperature = st.sidebar.select_slider(label="Temperature", options = list(np.arange(0.0,1.1, step=0.1)), value=1.0, help ="The value used to module the next token probabilities.", format_func=lambda x: f"{x:.2f}")
77
  top_p = st.sidebar.select_slider(label = "Top-P", options = list(np.arange(0.0,1.1, step=0.1)),value=1.0, help="Nucleus Sampling : If set to float < 1, only the most probable tokens with probabilities that add up to :obj:`top_p` or higher are kept for generation.", format_func=lambda x: f"{x:.2f}")
@@ -150,7 +153,7 @@ lang_id = new_col2.selectbox(
150
  sequence = ['']
151
  if new_col2.button("Generate Caption", help="Generate a caption in the specified language."):
152
  with st.spinner("Generating Sequence..."):
153
- sequence = generate_sequence(transformed_image, lang_id, num_beams, temperature, top_p)
154
  # print(sequence)
155
 
156
  if sequence!=['']:
 
44
  }
45
 
46
  @st.cache
47
+ def generate_sequence(pixel_values, lang_code, num_beams, temperature, top_p, do_sample, top_k, max_length):
48
  lang_code = language_mapping[lang_code]
49
+ output_ids = state.model.generate(input_ids=pixel_values, forced_bos_token_id=tokenizer.lang_code_to_id[lang_code], max_length=max_length, num_beams=num_beams, temperature=temperature, top_p = top_p, top_k=top_k, do_sample=do_sample)
50
  print(output_ids)
51
+ output_sequence = tokenizer.batch_decode(output_ids[0], skip_special_tokens=True, max_length=max_length)
52
  return output_sequence
53
 
54
  def read_markdown(path, parent="./sections/"):
 
72
  )
73
 
74
  st.sidebar.title("Generation Parameters")
75
+ max_length = st.sidebar.number_input("Max Length", min_value=16, max_value=128, value=64, step=1, help="The maximum length of sequence to be generated.")
76
+ do_sample = st.sidebar.checkbox("Sample", value=False, help="Sample from the model instead of using beam search.")
77
+ top_k = st.sidebar.number_input("Top K", min_value=10, max_value=200, value=50, step=1, help="The number of highest probability vocabulary tokens to keep for top-k-filtering.")
78
  num_beams = st.sidebar.number_input(label="Number of Beams", min_value=2, max_value=10, value=4, step=1, help="Number of beams to be used in beam search.")
79
  temperature = st.sidebar.select_slider(label="Temperature", options = list(np.arange(0.0,1.1, step=0.1)), value=1.0, help ="The value used to module the next token probabilities.", format_func=lambda x: f"{x:.2f}")
80
  top_p = st.sidebar.select_slider(label = "Top-P", options = list(np.arange(0.0,1.1, step=0.1)),value=1.0, help="Nucleus Sampling : If set to float < 1, only the most probable tokens with probabilities that add up to :obj:`top_p` or higher are kept for generation.", format_func=lambda x: f"{x:.2f}")
 
153
  sequence = ['']
154
  if new_col2.button("Generate Caption", help="Generate a caption in the specified language."):
155
  with st.spinner("Generating Sequence..."):
156
+ sequence = generate_sequence(transformed_image, lang_id, num_beams, temperature, top_p, do_sample, top_k, max_length)
157
  # print(sequence)
158
 
159
  if sequence!=['']: