Skip to content

Commit

Permalink
.
Browse files Browse the repository at this point in the history
  • Loading branch information
www committed Jul 1, 2024
1 parent 06aa1d4 commit 7b23d3b
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions API_DEMO_CHAT.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@
torch.backends.cudnn.allow_tf32 = True
torch.backends.cuda.matmul.allow_tf32 = True
os.environ["RWKV_JIT_ON"] = "1"
-os.environ["RWKV_CUDA_ON"] = "0" # '1' to compile CUDA kernel (10x faster), requires c++ compiler & cuda libraries
+os.environ["RWKV_CUDA_ON"] = "1" # '1' to compile CUDA kernel (10x faster), requires c++ compiler & cuda libraries

from rwkv.model import RWKV
from rwkv.utils import PIPELINE
Expand All @@ -24,7 +24,7 @@

args.strategy = "cuda fp16" # use CUDA, fp16

-args.MODEL_NAME = "E://RWKV-Runner//models//RWKV-5-World-1B5-v2-20231025-ctx4096"
+args.MODEL_NAME = "E://RWKV-Runner//models//rwkv-final-v6-2.1-7b"

GEN_TEMP = 1.0
GEN_TOP_P = 0.3
Expand Down

0 comments on commit 7b23d3b

Please sign in to comment.