Soumic committed on
Commit
846395b
1 Parent(s): df908e2

:hammer_and_pick: hyenadna ready to deploy

Browse files
Files changed (1) hide show
  1. app.py +8 -5
app.py CHANGED
@@ -245,15 +245,18 @@ def start():
245
  trust_remote_code=True)
246
  args = {
247
  "output_dir": "output_hyena_dna-mqtl_classification",
248
- "num_train_epochs": 1,
249
- "max_steps": 10,
250
  # Set the number of steps you expect to train, originally 1000, takes too much time. So I set it to 10 to run faster and check my code/pipeline
251
  "run_name": "laptop_run_hyena_dna-mqtl_classification", # Override run_name here
252
  "per_device_train_batch_size": 1,
253
- "gradient_accumulation_steps": 4,
254
  "gradient_checkpointing": True,
255
- "learning_rate": 2e-5,
256
- "save_safetensors": False # I added it. this solves the runtime error!
 
 
 
257
  }
258
 
259
  # """
 
245
  trust_remote_code=True)
246
  args = {
247
  "output_dir": "output_hyena_dna-mqtl_classification",
248
+ "num_train_epochs": 10,
249
+ "max_steps": 40_000, # train 36k + val 4k = 40k
250
  # Set the number of steps you expect to train, originally 1000, takes too much time. So I set it to 10 to run faster and check my code/pipeline
251
  "run_name": "laptop_run_hyena_dna-mqtl_classification", # Override run_name here
252
  "per_device_train_batch_size": 1,
253
+ "gradient_accumulation_steps": 32,
254
  "gradient_checkpointing": True,
255
+ "learning_rate": 1e-3,
256
+ "save_safetensors": False, # I added it. this solves the runtime error!
257
+ # Not sure this is a good idea: sklearn may slow down training and cost time. If so, disable the two lines below.
258
+ "evaluation_strategy": "epoch", # To calculate metrics per epoch
259
+ "logging_strategy": "epoch" # Extra: to log training data stats for loss
260
  }
261
 
262
  # """