n1ck-guo committed on
Commit
d56aebd
1 Parent(s): 08450d6

support for autoround type

Browse files

Signed-off-by: n1ck-guo <heng.guo@intel.com>

src/leaderboard/read_evals.py CHANGED
@@ -2,6 +2,7 @@ import glob
2
  import json
3
  import math
4
  import os
 
5
  from dataclasses import dataclass
6
 
7
  import dateutil
@@ -145,6 +146,7 @@ class EvalResult:
145
  except Exception as e:
146
  self.status = "Failed"
147
  print(f"Could not find request file for {self.org}/{self.model}")
 
148
 
149
  def update_with_dynamic_file_dict(self, file_dict):
150
  self.license = file_dict.get("license", "?")
 
2
  import json
3
  import math
4
  import os
5
+ import traceback
6
  from dataclasses import dataclass
7
 
8
  import dateutil
 
146
  except Exception as e:
147
  self.status = "Failed"
148
  print(f"Could not find request file for {self.org}/{self.model}")
149
+ print(traceback.format_exc())
150
 
151
  def update_with_dynamic_file_dict(self, file_dict):
152
  self.license = file_dict.get("license", "?")
src/submission/submit.py CHANGED
@@ -148,6 +148,10 @@ def add_new_eval(
148
  in_group_size = quantization_config.get('in_group_size')
149
  bits = int(nbits_per_codebook * num_codebooks / in_group_size)
150
  precision = f"{bits}bit"
 
 
 
 
151
 
152
  if precision == "4bit":
153
  weight_dtype = "int4"
 
148
  in_group_size = quantization_config.get('in_group_size')
149
  bits = int(nbits_per_codebook * num_codebooks / in_group_size)
150
  precision = f"{bits}bit"
151
+ if "auto-round" in quant_method:
152
+ hardware = "gpu"
153
+ quant_type = "AutoRound"
154
+ precision = f"{quantization_config.get('bits', '4bit')}bit"
155
 
156
  if precision == "4bit":
157
  weight_dtype = "int4"