govisi committed on
Commit
94d3885
1 Parent(s): f35bb8b
Files changed (1) hide show
  1. app.py +5 -4
app.py CHANGED
@@ -12,11 +12,12 @@ load_dotenv()
12
  bot = commands.Bot("", intents=discord.Intents.all())
13
 
14
  quantized = {
15
- "mode": TORCH_QUANT,
16
  "runtimedtype": torch.float32,
17
  "useGPU": torch.cuda.is_available(),
18
- "chunksize": 32, # larger = more accurate, but more memory
19
- "target": 100 # your gpu max size, excess vram offloaded to cpu
 
20
  }
21
 
22
  # model_pipe = pickle.load(open('pipe.pkl', 'rb'))
@@ -33,7 +34,7 @@ useGPU = torch.cuda.is_available() # False
33
  async def on_ready():
34
  print(f'We have logged in as {bot.user}')
35
  global model
36
- model = RWKV(path="https://huggingface.co/BlinkDL/rwkv-4-pile-1b5/resolve/main/RWKV-4-Pile-1B5-Instruct-test1-20230124.pth",
37
  **quantized)
38
 
39
 
 
12
  bot = commands.Bot("", intents=discord.Intents.all())
13
 
14
  quantized = {
15
+ "mode": TORCH,
16
  "runtimedtype": torch.float32,
17
  "useGPU": torch.cuda.is_available(),
18
+ # "chunksize": 32, # larger = more accurate, but more memory
19
+ # "target": 100, # your gpu max size, excess vram offloaded to cpu
20
+ "dtype": torch.float32
21
  }
22
 
23
  # model_pipe = pickle.load(open('pipe.pkl', 'rb'))
 
34
  async def on_ready():
35
  print(f'We have logged in as {bot.user}')
36
  global model
37
+ model = RWKV(path="https://huggingface.co/BlinkDL/rwkv-4-pile-3b/resolve/main/RWKV-4a-Pile-3B-20230110-8020.pth",
38
  **quantized)
39
 
40