Update README.md
Browse files
README.md
CHANGED
@@ -1,5 +1,11 @@
|
|
1 |
---
|
2 |
license: apache-2.0
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
---
|
4 |
|
5 |
# Model Description
|
@@ -109,16 +115,13 @@ write_dist_matrix(dist_matrix, max_dist, output_data_filename_, verbose=True)
|
|
109 |
end = time.perf_counter()
|
110 |
"""
|
111 |
|
112 |
-
tokenizer = AutoTokenizer.from_pretrained('
|
113 |
-
model = AutoModelForCausalLM.from_pretrained('
|
114 |
encoded_input = tokenizer(example, return_tensors='pt', return_token_type_ids=False)
|
115 |
input_len = len(encoded_input["input_ids"][0])
|
116 |
out = model.generate(
|
117 |
**encoded_input,
|
118 |
max_new_tokens=100,
|
119 |
-
num_beams=1,
|
120 |
-
pad_token_id=tokenizer.eos_token_id,
|
121 |
-
eos_token_id=tokenizer.eos_token_id,
|
122 |
)
|
123 |
print("### Context")
|
124 |
print(tokenizer.decode(out[0][:input_len]))
|
@@ -138,4 +141,4 @@ If you use this model, please cite:
|
|
138 |
```
|
139 |
|
140 |
# Contact
|
141 |
-
For questions, collaborations and requests reach us out via [email protected]
|
|
|
1 |
---
|
2 |
license: apache-2.0
|
3 |
+
datasets:
|
4 |
+
- bigcode/the-stack
|
5 |
+
- bigcode/the-stack-v2
|
6 |
+
- bigcode/starcoderdata
|
7 |
+
- bigcode/commitpack
|
8 |
+
library_name: transformers
|
9 |
---
|
10 |
|
11 |
# Model Description
|
|
|
115 |
end = time.perf_counter()
|
116 |
"""
|
117 |
|
118 |
+
tokenizer = AutoTokenizer.from_pretrained('JetBrains/Mellum-4b-base')
|
119 |
+
model = AutoModelForCausalLM.from_pretrained('JetBrains/Mellum-4b-base')
|
120 |
encoded_input = tokenizer(example, return_tensors='pt', return_token_type_ids=False)
|
121 |
input_len = len(encoded_input["input_ids"][0])
|
122 |
out = model.generate(
|
123 |
**encoded_input,
|
124 |
max_new_tokens=100,
|
|
|
|
|
|
|
125 |
)
|
126 |
print("### Context")
|
127 |
print(tokenizer.decode(out[0][:input_len]))
|
|
|
141 |
```
|
142 |
|
143 |
# Contact
|
144 |
+
For questions, collaborations, and requests, reach out to us via [email protected]
|