SmerkyG
/

rwkv-5-world-1b5

Text Generation

Model card Files Files and versions

SmerkyG committed on Mar 23, 2024

Commit

d420145

·

verified ·

1 Parent(s): 2b07ca9

Update modeling_rwkv5.py

Files changed (1) hide show

modeling_rwkv5.py +4 -1

modeling_rwkv5.py CHANGED Viewed

@@ -789,7 +789,10 @@ class Rwkv5ForCausalLM(Rwkv5PreTrainedModel):
         # only last token for inputs_ids if the state is passed along.
         if state is not None:
             input_ids = input_ids[:, -1].unsqueeze(-1)
         # if `inputs_embeds` are passed, we only want to use them in the 1st generation step
         if inputs_embeds is not None and state is None:
             model_inputs = {"inputs_embeds": inputs_embeds}

         # only last token for inputs_ids if the state is passed along.
         if state is not None:
             input_ids = input_ids[:, -1].unsqueeze(-1)
+        else:
+            # add in \n at the beginning
+            input_ids = torch.cat([torch.full([1,1],11,device=input_ids.device,dtype=input_ids.dtype), input_ids])
         # if `inputs_embeds` are passed, we only want to use them in the 1st generation step
         if inputs_embeds is not None and state is None:
             model_inputs = {"inputs_embeds": inputs_embeds}