Skip to content

Commit

Permalink
fix
Browse files Browse the repository at this point in the history
  • Loading branch information
www committed Feb 3, 2024
1 parent 901f268 commit 4caa6e9
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions API_DEMO_CHAT.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,9 @@
torch.backends.cudnn.benchmark = True
torch.backends.cudnn.allow_tf32 = True
torch.backends.cuda.matmul.allow_tf32 = True
os.environ["RWKV_JIT_ON"] = "1"
os.environ["RWKV_CUDA_ON"] = "0" # set to '1' to compile the CUDA kernel (10x faster); requires a C++ compiler and the CUDA libraries

from rwkv.model import RWKV
from rwkv.utils import PIPELINE

Expand All @@ -20,8 +23,6 @@
args = types.SimpleNamespace()

args.strategy = "cuda fp16" # use CUDA, fp16
os.environ["RWKV_JIT_ON"] = "1"
os.environ["RWKV_CUDA_ON"] = "0" # set to '1' to compile the CUDA kernel (10x faster); requires a C++ compiler and the CUDA libraries

args.MODEL_NAME = "E://RWKV-Runner//models//RWKV-5-World-1B5-v2-20231025-ctx4096"

Expand Down

0 comments on commit 4caa6e9

Please sign in to comment.