Use 1-based indexing for position ids
Browse files
README.md
CHANGED
@@ -42,7 +42,7 @@ past_key_values = {
 }
 input_ids = inputs['input_ids']
 attention_mask = inputs['attention_mask']
-position_ids = np.cumsum(inputs['attention_mask'], axis=-1)
+position_ids = np.cumsum(inputs['attention_mask'], axis=-1)
 
 # 3. Generation loop
 max_new_tokens = 1024