Skip to content

Commit

Permalink
.
Browse files Browse the repository at this point in the history
  • Loading branch information
www committed May 9, 2024
1 parent 89bd9ad commit 3d65c52
Showing 1 changed file with 2 additions and 0 deletions.
2 changes: 2 additions & 0 deletions RWKV_v6_demo_cuda_bf16.py
Original file line number Diff line number Diff line change
Expand Up @@ -121,6 +121,7 @@ def sample_logits(out, temperature=1.0, top_p=0.8):
# Configuration values set on `args` (defined outside this excerpt).
# NOTE(review): presumably these describe the checkpoint being loaded and must
# match it — confirm against the model file actually used.
args.n_layer = 32
args.n_embd = 2560
args.vocab_size = 65536
# Compared by an assert in __init__ (further down in this excerpt) against the
# head size derived from the loaded weights.
args.head_size = 64

# Input text; presumably the generation prompt — confirm against its use
# further down the file.
context = "\nElon Musk's favorite"
# context = "\n北京"
Expand All @@ -145,6 +146,7 @@ def __init__(self, args):

self.n_head = w['blocks.0.att.time_faaaa'].shape[0]
self.head_size = w['blocks.0.ln1.weight'].shape[0] // self.n_head
assert self.head_size == args.head_size

self.w = types.SimpleNamespace() # set self.w from w
self.w.blocks = {}
Expand Down

0 comments on commit 3d65c52

Please sign in to comment.