Cyrile committed
Commit 1ac2b83 · verified · 1 parent: fd39e84

Upload TextClassificationPipeline

Files changed (3):
  1. config.json +2 -2
  2. model.safetensors +2 -2
  3. tokenizer_config.json +4 -0
config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "../models/EuroBERT-210m-Quality/",
+  "_name_or_path": "../models/EuroBERT-210m-Quality",
   "architectures": [
     "EuroBertForSequenceClassification"
   ],
@@ -50,7 +50,7 @@
   "rope_scaling": null,
   "rope_theta": 250000,
   "tie_word_embeddings": false,
-  "torch_dtype": "bfloat16",
+  "torch_dtype": "float32",
   "transformers_version": "4.49.0",
   "use_cache": false,
   "vocab_size": 128256
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bd9f995bacb9411087ac6f3cb7ec4d76b453395edf81d6e181e27110c255b997
-size 424732032
+oid sha256:f5a81d5c4bded815a646aaa8861079b54756628c0b8e9eea82cdf5010a9af8ec
+size 849451288
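The file size roughly doubles (424,732,032 → 849,451,288 bytes), consistent with the bfloat16 → float32 switch in config.json: 2 bytes per parameter become 4. A quick back-of-the-envelope check (pure arithmetic, nothing beyond the diff):

    old_size, new_size = 424_732_032, 849_451_288
    print(new_size / old_size)  # ~2.0: 2-byte bfloat16 -> 4-byte float32
    print(new_size / 4 / 1e6)   # ~212M parameters, matching "EuroBERT-210m"
                                # (approximate: the file also holds a small header)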
tokenizer_config.json CHANGED
@@ -2055,11 +2055,15 @@
   "eos_token": "<|end_of_text|>",
   "extra_special_tokens": {},
   "mask_token": "<|mask|>",
+  "max_length": 512,
   "model_input_names": [
     "input_ids",
     "attention_mask"
   ],
   "model_max_length": 1000000000000000019884624838656,
+  "pad_to_multiple_of": null,
   "pad_token": "<|end_of_text|>",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
   "tokenizer_class": "PreTrainedTokenizer"
 }
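These additions pin the preprocessing defaults the uploaded TextClassificationPipeline relies on: "model_max_length" is still the no-limit sentinel, so the new "max_length": 512 supplies a real truncation length, and batches are right-padded with the <|end_of_text|> pad token. A hedged usage sketch (same hypothetical repo id and trust_remote_code assumption as above):

    from transformers import pipeline

    clf = pipeline(
        "text-classification",
        model="Cyrile/EuroBERT-210m-Quality",  # hypothetical repo id
        trust_remote_code=True,                # assumption: custom EuroBERT code
    )

    # With truncation enabled, long inputs are cut to the saved max_length (512);
    # padding_side="right" keeps batched attention masks aligned as expected.
    print(clf("Some long document whose quality we want to score.", truncation=True))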