spl4shedEdu committed on
Commit
6bdc600
·
verified ·
1 Parent(s): 552629d

Upload model checkpoint

Browse files
1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 768,
3
+ "pooling_mode_cls_token": false,
4
+ "pooling_mode_mean_tokens": true,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
README.md ADDED
@@ -0,0 +1,443 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: sentence-transformers/all-mpnet-base-v2
3
+ datasets: []
4
+ language: []
5
+ library_name: sentence-transformers
6
+ pipeline_tag: sentence-similarity
7
+ tags:
8
+ - sentence-transformers
9
+ - sentence-similarity
10
+ - feature-extraction
11
+ - generated_from_trainer
12
+ - dataset_size:269761
13
+ - loss:CachedMultipleNegativesRankingLoss
14
+ widget:
15
+ - source_sentence: mohawk industries mqrt01425 72 inch rustic suede hickory laminate
16
+ quarter round mqrt01425 cork bamboo tile more stepco nuvelle high gloss flooring
17
+ sale hardwood mohawk industries toolsandhomeimprovement
18
+ sentences:
19
+ - nokya heavy duty headlight harnesses high beam 0305 toyota mrs mrs 9005hb3 or
20
+ as complete upgrades a precautionary measure against harness plug burnouts which
21
+ can permanently damage your toyota mrs headlight housings these heavy duty headlight
22
+ high beam 9005 wire harnesses also help to handle the increased demands of aftermarket
23
+ bulbs nokya offers these harnesses cheap and relatively easy upgrade stock electrical
24
+ system they work replacements for damaged plugs lighting are not designed extended
25
+ periods use operation in adverse severe conditions to address this brand otherwise
26
+ each set consists 2 harnesses these have been be plugged into mrss wiring aftermarket
27
+ automotive
28
+ - mohawk industries mqrt01425 72 inch rustic suede hickory laminate quarter round
29
+ mqrt01425 cork bamboo tile mincp01425 barrington 846quot instaform profile sale
30
+ hardwood mohawk industries toolsandhomeimprovement
31
+ - fuel hose 120 x 170 mm outside cloth braided 1994 bmw 318i base convertible fuel
32
+ system page 1 note working pressure 7 bar sold by the meter cohline automotive
33
+ - source_sentence: camshaft adapter ignition rotor 1988 bmw 325i base sedan camshafts
34
+ timing chains page 1 genuine bmw automotive
35
+ sentences:
36
+ - needle nose pliers 40 deg angled 8 in length 1980 bmw 320i base coupe tools page
37
+ 6 note with cutter distortiontolerant elastic precision tips halfround long pointed
38
+ jaws vanadium electric steel forged oilhardened black atramentized finish with
39
+ polished head plastic coated handles knipex toolsandhomeimprovement
40
+ - spyder cold air intake system black 9802 honda accord 30l v6 high flow washable
41
+ reusable stainless steel air filter spyder honda accord black cold air intake
42
+ system helps to draw more and colder your engine than stock box setup this spyder
43
+ kit will give you approximately 510 horsepower increase your results may vary
44
+ but the sound definitely be intense comes with aluminum intake pipe pressure silicon
45
+ hose mounting accessories automotive
46
+ - camshaft adapter ignition rotor 1988 bmw 325i base convertible camshafts timing
47
+ chains page 1 genuine bmw automotive
48
+ - source_sentence: premium underlayment 100 sq ft cork bamboo tile more amtico premium
49
+ pressplate 12 x new bronze vinyl flooring sale hardwood premium underlayment 100
50
+ sq ft bellawood toolsandhomeimprovement
51
+ sentences:
52
+ - spray flat clear ts80 100ml paints and tools clearcoats new products spotmodel
53
+ tamiya toolsandhomeimprovement
54
+ - seasucker mini bomber 2bike forkmount rack with 2 rear wheel straps 1975 bmw 2002
55
+ base coupe exterior trim page 3 automotive
56
+ - premium underlayment 100 sq ft cork bamboo tile mo armstrong flooring 52157 clay
57
+ red commercial vinyl composition stonetex premium excelon sale hardwood premium
58
+ underlayment 100 sq ft bellawood toolsandhomeimprovement
59
+ - source_sentence: circular connector mildtl38999 series i wall mount receptacle 56
60
+ contacts receptacle contacts farnell element14 i amphenol industrial circular
61
+ connector the from amphenol is mildtl38999 series i wall mount receptacle with
62
+ 56 contacts mildtl38999 series i connectors are available in a wide range of shell
63
+ materials and finishes with 48 500 and 1000 hour salt spray plating exposure these
64
+ connectors offer high density contact arrangements in a miniature circular shell
65
+ and combines high coupling durability it has an improved sealing around each contact
66
+ to prevent electrolytic erosion these connectors are available in 9 shell size
67
+ from 9 to 25 and are designed to withstand extreme shock exposure and vibration
68
+ amphenol industrial otherelectronics
69
+ sentences:
70
+ - us buy amphenol aerospace aeri is a stocking distributor of electronic componentsus
71
+ military specification connector 56p size 25 wall mount receptacle sktus otherelectronics
72
+ part number manufacturer amphenol aerospace description military specification
73
+ connector 56p size 25 wall mount receptacle skt warranty 1 year aeri guarantee
74
+ learn more quantity in network 9666 available through the aeri network
75
+ - griots garage 3 random orbital 10ft cord 2001 bmw 325ci base convertible miscellaneous
76
+ page 25 automotive
77
+ - 785247176564 and height is 5 under 10 bulbscom close to ceiling light fixtures
78
+ from progress lighting where diameter 12 18 progress lighting threelight flush
79
+ mount progress lighting brand toolsandhomeimprovement
80
+ - source_sentence: moor brown gb 2014 audi a5s5 cabriolet south africa market body
81
+ middle armrest front pr6e3gb if period 0911 gb automotive
82
+ sentences:
83
+ - apc cork apctopazsn gem topaz stair nose apctopazsn bamboo tile more bruce 78in
84
+ turlington smokey reducer american exotics hardwood flooring accessory sale price
85
+ sq ft gem topaz stair nose apc cork apctopazsn gem topaz stair nose apctopazsn
86
+ instock apc cork toolsandhomeimprovement
87
+ - moor brown gb 2013 audi a4 allroad quattro canada market body middle armrest front
88
+ pr6e3gb if period 1111 gb automotive
89
+ - smart racing products smartstrings 4wheel alignment set 1996 bmw 318i base convertible
90
+ suspension tools page 1 automotive
91
+ ---
92
+
93
+ # SentenceTransformer based on sentence-transformers/all-mpnet-base-v2
94
+
95
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [sentence-transformers/all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
96
+
97
+ ## Model Details
98
+
99
+ ### Model Description
100
+ - **Model Type:** Sentence Transformer
101
+ - **Base model:** [sentence-transformers/all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2) <!-- at revision 84f2bcc00d77236f9e89c8a360a00fb1139bf47d -->
102
+ - **Maximum Sequence Length:** 384 tokens
103
+ - **Output Dimensionality:** 768 dimensions
104
+ - **Similarity Function:** Cosine Similarity
105
+ <!-- - **Training Dataset:** Unknown -->
106
+ <!-- - **Language:** Unknown -->
107
+ <!-- - **License:** Unknown -->
108
+
109
+ ### Model Sources
110
+
111
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
112
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
113
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
114
+
115
+ ### Full Model Architecture
116
+
117
+ ```
118
+ SentenceTransformer(
119
+ (0): Transformer({'max_seq_length': 384, 'do_lower_case': False}) with Transformer model: MPNetModel
120
+ (1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
121
+ (2): Normalize()
122
+ )
123
+ ```
124
+
125
+ ## Usage
126
+
127
+ ### Direct Usage (Sentence Transformers)
128
+
129
+ First install the Sentence Transformers library:
130
+
131
+ ```bash
132
+ pip install -U sentence-transformers
133
+ ```
134
+
135
+ Then you can load this model and run inference.
136
+ ```python
137
+ from sentence_transformers import SentenceTransformer
138
+
139
+ # Download from the 🤗 Hub
140
+ model = SentenceTransformer("sentence_transformers_model_id")
141
+ # Run inference
142
+ sentences = [
143
+ 'moor brown gb 2014 audi a5s5 cabriolet south africa market body middle armrest front pr6e3gb if period 0911 gb automotive',
144
+ 'moor brown gb 2013 audi a4 allroad quattro canada market body middle armrest front pr6e3gb if period 1111 gb automotive',
145
+ 'smart racing products smartstrings 4wheel alignment set 1996 bmw 318i base convertible suspension tools page 1 automotive',
146
+ ]
147
+ embeddings = model.encode(sentences)
148
+ print(embeddings.shape)
149
+ # [3, 768]
150
+
151
+ # Get the similarity scores for the embeddings
152
+ similarities = model.similarity(embeddings, embeddings)
153
+ print(similarities.shape)
154
+ # [3, 3]
155
+ ```
156
+
157
+ <!--
158
+ ### Direct Usage (Transformers)
159
+
160
+ <details><summary>Click to see the direct usage in Transformers</summary>
161
+
162
+ </details>
163
+ -->
164
+
165
+ <!--
166
+ ### Downstream Usage (Sentence Transformers)
167
+
168
+ You can finetune this model on your own dataset.
169
+
170
+ <details><summary>Click to expand</summary>
171
+
172
+ </details>
173
+ -->
174
+
175
+ <!--
176
+ ### Out-of-Scope Use
177
+
178
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
179
+ -->
180
+
181
+ <!--
182
+ ## Bias, Risks and Limitations
183
+
184
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
185
+ -->
186
+
187
+ <!--
188
+ ### Recommendations
189
+
190
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
191
+ -->
192
+
193
+ ## Training Details
194
+
195
+ ### Training Dataset
196
+
197
+ #### Unnamed Dataset
198
+
199
+
200
+ * Size: 269,761 training samples
201
+ * Columns: <code>anchor</code> and <code>positive</code>
202
+ * Approximate statistics based on the first 1000 samples:
203
+ | | anchor | positive |
204
+ |:--------|:------------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
205
+ | type | string | string |
206
+ | details | <ul><li>min: 15 tokens</li><li>mean: 69.38 tokens</li><li>max: 384 tokens</li></ul> | <ul><li>min: 11 tokens</li><li>mean: 70.41 tokens</li><li>max: 384 tokens</li></ul> |
207
+ * Samples:
208
+ | anchor | positive |
209
+ |:----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------
--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
210
+ | <code>2008 dodge ram 2500 laramie used white for sale in euless tx dodge automotive mileage 17383 exterior color arctic white transmission 7speed automatic wod engine intercooled turbo diesel i4 21 l131 stock 4gp307369 wdzpe7dd4gp307369 mercedesbenz used sprinter passenger vans mileage 148438 exterior color white transmission 4speed hd automatic wod 4l65e engine gas v8 60l364 stock x4h100607 5grgn23ux4h100607 hummer used h2 mileage 34383 exterior color white satin pearl transmission 8speed automatic wmanual shift engine gas v8 50l307 stock 4du072090 kmhgh4jh4du072090 hyundai used equus mileage 107520 exterior color bright white clearcoat transmission 6speed automatic engine gas i4 24l144 stock xcn207909 1c3ccbbbxcn207909 chrysler used 200 mileage 59582 exterior color bright white clearcoat transmission 6speed automatic engine gas i4 24l144 stock 3dn554452 1c3ccbbb3dn554452 chrysler used 200 mileage 76681 exterior color taffeta white transmission 5speed automatic engine gas i4 24l144 stock 5ag705280 3czre3h35ag705280 honda used crv mileage 99896 exterior color premium white pearl transmission 5speed automatic wod engine gas i4 24l144 stock 6xac03652 jh4cu2f6xac036527 acura used tsx mileage 125522 exterior color crystal white transmission 1speed ecvt engine gaselectric v6 33l202 stock x82851820 jtjgw31ux82851820 lexus used rx 400h mileage 36797 exterior color clear white transmission 6speed automatic wod engine regular unleaded i4 24 l144 stock 0h7070128 kndpm3ac0h7070128 kia used sportage mileage 77058 exterior color bright white clearcoat transmission 5speed automatic engine gas v6 36l220 stock 0dh649637 2c3cdyag0dh649637 dodge used challenger mileage 39319 exterior color arctic white transmission 7speed automatic engine gas v6 30l183 stock 8br178298 wddgf8bb8br178298 mercedesbenz used cclass mileage 64038 exterior color white gold clearcoat transmission 5speed automatic wod engine gas v8 57l345 stock 7bs615073 1d7rb1ct7bs615073 ram used 1500 mileage 69807 
exterior color bright white clearcoat transmission 4speed automatic engine gas v8 57l345 stock 9cs228465 1c6rd6ft9cs228465 ram used 1500 mileage 14918 exterior color pearl white transmission 1speed cvt wod engine regular unleaded i4 25 l152 stock xgp686433 knmat2mtxgp686433 nissan used rogue mileage 39730 exterior color fuji white transmission 6speed automatic engine gas i6 32l195 stock xch305122 salfr2bnxch305122 land rover used lr2 mileage 34618 exterior color snow white pearl transmission 6speed automatic wod engine regular unleaded v6 33 l204 stock 6fg577726 5xykw4a76fg577726 kia used sorento mileage 169861 exterior color oxford white transmission 6speed automatic engine turbocharged diesel v8 67l406 stock 1bea21901 1ft7w2bt1bea21901 ford used super duty f250 srw mileage 21309 exterior color pure red transmission 8speed cvt wod engine intercooled turbo premium unleaded h4 20 l122 stock 3g8807653 jf1va1e63g8807653 subaru used wrx mileage 61401 exterior color white gold clearcoat transmission automatic engine gas v8 57l345 stock 5bg609448 3d7tt2ct5bg609448 ram used 2500 mileage 28253 exterior color bright white clearcoat transmission 8speed automatic wod engine regular unleaded v6 36 l220 stock 2ec478489 1c4rjfbg2ec478489 jeep used grand cherokee mileage 33929 exterior color bright white clearcoat transmission 6speed automatic engine gas v8 57l345 stock xdc653013 1c4sdjctxdc653013 dodge used durango mileage 178293 exterior color bright white clearcoat transmission automatic engine diesel i6 67l409 stock 3d3ks29a dodge used ram 2500 mileage 107825 exterior color diamond white metallic transmission 7speed automatic wmanual shift engine turbocharged gas v8 46l285 stock 9da114638 4jgdf7ce9da114638 mercedesbenz used glclass mileage 17831 exterior color cirrus white transmission 7speed autoshift</code> | <code>2008 dodge ram 2500 laramie used white for sale in euless tx dodge automotive mileage 17383 exterior color arctic white transmission 7speed automatic wod engine 
intercooled turbo diesel i4 21 l131 stock 4gp307369 wdzpe7dd4gp307369 mercedesbenz used sprinter passenger vans mileage 148438 exterior color white transmission 4speed hd automatic wod 4l65e engine gas v8 60l364 stock x4h100607 5grgn23ux4h100607 hummer used h2 mileage 34383 exterior color white satin pearl transmission 8speed automatic wmanual shift engine gas v8 50l307 stock 4du072090 kmhgh4jh4du072090 hyundai used equus mileage 107520 exterior color bright white clearcoat transmission 6speed automatic engine gas i4 24l144 stock xcn207909 1c3ccbbbxcn207909 chrysler used 200 mileage 59582 exterior color bright white clearcoat transmission 6speed automatic engine gas i4 24l144 stock 3dn554452 1c3ccbbb3dn554452 chrysler used 200 mileage 76681 exterior color taffeta white transmission 5speed automatic engine gas i4 24l144 stock 5ag705280 3czre3h35ag705280 honda used crv mileage 99896 exterior color premium white pearl transmission 5speed automatic wod engine gas i4 24l144 stock 6xac03652 jh4cu2f6xac036527 acura used tsx mileage 125522 exterior color crystal white transmission 1speed ecvt engine gaselectric v6 33l202 stock x82851820 jtjgw31ux82851820 lexus used rx 400h mileage 36797 exterior color clear white transmission 6speed automatic wod engine regular unleaded i4 24 l144 stock 0h7070128 kndpm3ac0h7070128 kia used sportage mileage 77058 exterior color bright white clearcoat transmission 5speed automatic engine gas v6 36l220 stock 0dh649637 2c3cdyag0dh649637 dodge used challenger mileage 39319 exterior color arctic white transmission 7speed automatic engine gas v6 30l183 stock 8br178298 wddgf8bb8br178298 mercedesbenz used cclass mileage 64038 exterior color white gold clearcoat transmission 5speed automatic wod engine gas v8 57l345 stock 7bs615073 1d7rb1ct7bs615073 ram used 1500 mileage 69807 exterior color bright white clearcoat transmission 4speed automatic engine gas v8 57l345 stock 9cs228465 1c6rd6ft9cs228465 ram used 1500 mileage 14918 exterior color pearl 
white transmission 1speed cvt wod engine regular unleaded i4 25 l152 stock xgp686433 knmat2mtxgp686433 nissan used rogue mileage 39730 exterior color fuji white transmission 6speed automatic engine gas i6 32l195 stock xch305122 salfr2bnxch305122 land rover used lr2 mileage 34618 exterior color snow white pearl transmission 6speed automatic wod engine regular unleaded v6 33 l204 stock 6fg577726 5xykw4a76fg577726 kia used sorento mileage 169861 exterior color oxford white transmission 6speed automatic engine turbocharged diesel v8 67l406 stock 1bea21901 1ft7w2bt1bea21901 ford used super duty f250 srw mileage 21309 exterior color pure red transmission 8speed cvt wod engine intercooled turbo premium unleaded h4 20 l122 stock 3g8807653 jf1va1e63g8807653 subaru used wrx mileage 61401 exterior color white gold clearcoat transmission automatic engine gas v8 57l345 stock 5bg609448 3d7tt2ct5bg609448 ram used 2500 mileage 28253 exterior color bright white clearcoat transmission 8speed automatic wod engine regular unleaded v6 36 l220 stock 2ec478489 1c4rjfbg2ec478489 jeep used grand cherokee mileage 33929 exterior color bright white clearcoat transmission 6speed automatic engine gas v8 57l345 stock xdc653013 1c4sdjctxdc653013 dodge used durango mileage 178293 exterior color bright white clearcoat transmission automatic engine diesel i6 67l409 stock 3d3ks29a dodge used ram 2500 mileage 107825 exterior color diamond white metallic transmission 7speed automatic wmanual shift engine turbocharged gas v8 46l285 stock 9da114638 4jgdf7ce9da114638 mercedesbenz used glclass mileage 17831 exterior color cirrus white transmission 7speed autoshift</code> |
211
+ | <code>pacon fade resistant neon poster board us pacon officesupplycomus officeproducts</code> | <code>pacon fade resistant neon poster board us pacon officesupplycomus officeproducts</code> |
212
+ | <code>2015 bmw 535i xdrive sedan texas 76132 2015 535 lease special promotion on a for 87681 per month fort worth automotive</code> | <code>2015 bmw 535i xdrive sedan florida 34787 2015 535 xdriv lease special promotion on sedan a for 76289 per month winter garden automotive listing number car bmw 535i xdrive sedan condition outstanding transmission automatic vin wba5b3c59fd540941 down payment 000 down engine 6 cylinder fuel type gasoline doors four door drivetrain four wheel drive rear brake width 09 emergency braking preparation emergency braking preparation brake drying brake drying front brake width 14 rear brake type ventilated disc electronic brakeforce distribution electronic brakeforce distribution front brake diameter 137 front brake type ventilated disc antilock braking system 4wheel abs braking assist braking assist rear brake diameter 130 overall width without mirrors 732 wheelbase 1169 overall length 1931 minimum ground clearance 56 overall height 576 rear track 641 front track 630 ege highway mpg 29 epa combined mpg 23 manufacturer 0 100km acceleration time seconds 58 aerodynamic drag cd 030 epa city mpg 19 turning diameter 392 curb weight 4233 tco curb weight 4233 epa highway mpg 29 fuel capacity 185 ege city mpg 19 height adjustable driver seat height adjustable driver seat adjustable lumbar power adjustable lumbar support driver seat whiplash protection whiplash protection system driver seat easy entry power steering wheel number of driver seat power adjustments 10 number of memorized driver seat settings 2 adjustable driver seat headrest power adjustable headrests 2nd row leg room 361 2nd row shoulder room 562 2nd row head room 383 1st row leg room 414 1st row head room 405 1st row shoulder room 583 epa interior volume 116 in dash cd single cd player audio system memory feature includes audio system digital audio input auxiliary audio input and ipodiphone integration total number of speakers 10 mp3 player cd mp3 playback antenna type diversity 
audio security system audio security system usb connection usb connection radio data system radio data system radio amfm hd radio watts 180 subwoofer 2 rear tire width 245 run flat tires run flat tire type all season rear tire diameter 18 rear tire profile 45 rear tire speed rating v rear tire width 245 run flat tires run flat tire type all season rear tire diameter 19 rear tire profile 40 in dash cd single cd player digital audio input auxiliary audio input and ipodiphone integration total number of speakers 16 mp3 player cd mp3 playback speed sensitive volume control speed sensitive volume control radio data system radio data system dvd audio dvdaudio radio amfm hd radio satellite radio sirius watts 600 surround audio 51 months of provided satellite radio service 12 rear tire width 245 run flat tires run flat tire type all season rear tire diameter 19 rear tire profile 40 warranty maximum mileage 50000 warranty miles limitedunlimited l warranty years limitedunlimited l warranty maximum years 4 warranty type basic warranty maximum mileage 50000 warranty miles limitedunlimited l warranty years limitedunlimited l warranty maximum years 4 warranty type drivetrain warranty maximum mileage 50000 warranty comments free full maintenance for 4 years or 50000 miles warranty miles limitedunlimited l warranty years limitedunlimited l warranty maximum years 4 warranty</code> |
213
+ * Loss: [<code>CachedMultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cachedmultiplenegativesrankingloss) with these parameters:
214
+ ```json
215
+ {
216
+ "scale": 20.0,
217
+ "similarity_fct": "cos_sim"
218
+ }
219
+ ```
220
+
221
+ ### Evaluation Dataset
222
+
223
+ #### Unnamed Dataset
224
+
225
+
226
+ * Size: 67,441 evaluation samples
227
+ * Columns: <code>anchor</code> and <code>positive</code>
228
+ * Approximate statistics based on the first 1000 samples:
229
+ | | anchor | positive |
230
+ |:--------|:------------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
231
+ | type | string | string |
232
+ | details | <ul><li>min: 14 tokens</li><li>mean: 68.57 tokens</li><li>max: 384 tokens</li></ul> | <ul><li>min: 15 tokens</li><li>mean: 69.25 tokens</li><li>max: 384 tokens</li></ul> |
233
+ * Samples:
234
+ | anchor | positive |
235
+ |:-------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
236
+ | <code>barracuda essentials for office 365 complete protection and compliance li barracuda li email security cdwgcom five year license renewal for barracuda essentials for office 365 complete protection for up to 249 users otherelectronics</code> | <code>barracuda essentials for office 365 complete protection and compliance li barracuda li email security cdwcom five year license renewal for barracuda essentials for office 365 complete protection for up to 249 users otherelectronics</code> |
237
+ | <code>cool carbon performance brake pad set rear 2003 bmw 325i base sedan upgrades page 2 automotive</code> | <code>cool carbon performance brake pad set rear 2002 bmw 325i base wagon upgrades page 2 automotive</code> |
238
+ | <code>decoart americana acrylic paint williamsburg blue 2 ounces blue 2 oz cover art projects with affordable quality our 2ounce bottle of americana acrylic paint in williamsburg blue boasts a bright pigment that can be used on almost any surface once dry this paint will create a durable matte finish that can be varnished to create a variety of sheens blue acrylic paint permanent waterbased nontoxic lightfast pigment one coat coverage with most colors intermixable blends easily consistent viscosity made in usa toolsandhomeimprovement</code> | <code>decoart americana acrylic paint williamsburg blue 2 oz wholesale darice decoart americana acrylic paint williamsburg blue 2 oz decoart toolsandhomeimprovement</code> |
239
+ * Loss: [<code>CachedMultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cachedmultiplenegativesrankingloss) with these parameters:
240
+ ```json
241
+ {
242
+ "scale": 20.0,
243
+ "similarity_fct": "cos_sim"
244
+ }
245
+ ```
246
+
247
+ ### Training Hyperparameters
248
+ #### Non-Default Hyperparameters
249
+
250
+ - `eval_strategy`: steps
251
+ - `learning_rate`: 1e-05
252
+ - `num_train_epochs`: 2
253
+ - `warmup_ratio`: 0.1
254
+ - `fp16`: True
255
+ - `auto_find_batch_size`: True
256
+ - `batch_sampler`: no_duplicates
257
+
258
+ #### All Hyperparameters
259
+ <details><summary>Click to expand</summary>
260
+
261
+ - `overwrite_output_dir`: False
262
+ - `do_predict`: False
263
+ - `eval_strategy`: steps
264
+ - `prediction_loss_only`: True
265
+ - `per_device_train_batch_size`: 8
266
+ - `per_device_eval_batch_size`: 8
267
+ - `per_gpu_train_batch_size`: None
268
+ - `per_gpu_eval_batch_size`: None
269
+ - `gradient_accumulation_steps`: 1
270
+ - `eval_accumulation_steps`: None
271
+ - `torch_empty_cache_steps`: None
272
+ - `learning_rate`: 1e-05
273
+ - `weight_decay`: 0.0
274
+ - `adam_beta1`: 0.9
275
+ - `adam_beta2`: 0.999
276
+ - `adam_epsilon`: 1e-08
277
+ - `max_grad_norm`: 1.0
278
+ - `num_train_epochs`: 2
279
+ - `max_steps`: -1
280
+ - `lr_scheduler_type`: linear
281
+ - `lr_scheduler_kwargs`: {}
282
+ - `warmup_ratio`: 0.1
283
+ - `warmup_steps`: 0
284
+ - `log_level`: passive
285
+ - `log_level_replica`: warning
286
+ - `log_on_each_node`: True
287
+ - `logging_nan_inf_filter`: True
288
+ - `save_safetensors`: True
289
+ - `save_on_each_node`: False
290
+ - `save_only_model`: False
291
+ - `restore_callback_states_from_checkpoint`: False
292
+ - `no_cuda`: False
293
+ - `use_cpu`: False
294
+ - `use_mps_device`: False
295
+ - `seed`: 42
296
+ - `data_seed`: None
297
+ - `jit_mode_eval`: False
298
+ - `use_ipex`: False
299
+ - `bf16`: False
300
+ - `fp16`: True
301
+ - `fp16_opt_level`: O1
302
+ - `half_precision_backend`: auto
303
+ - `bf16_full_eval`: False
304
+ - `fp16_full_eval`: False
305
+ - `tf32`: None
306
+ - `local_rank`: 0
307
+ - `ddp_backend`: None
308
+ - `tpu_num_cores`: None
309
+ - `tpu_metrics_debug`: False
310
+ - `debug`: []
311
+ - `dataloader_drop_last`: False
312
+ - `dataloader_num_workers`: 0
313
+ - `dataloader_prefetch_factor`: None
314
+ - `past_index`: -1
315
+ - `disable_tqdm`: False
316
+ - `remove_unused_columns`: True
317
+ - `label_names`: None
318
+ - `load_best_model_at_end`: False
319
+ - `ignore_data_skip`: False
320
+ - `fsdp`: []
321
+ - `fsdp_min_num_params`: 0
322
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
323
+ - `fsdp_transformer_layer_cls_to_wrap`: None
324
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
325
+ - `deepspeed`: None
326
+ - `label_smoothing_factor`: 0.0
327
+ - `optim`: adamw_torch
328
+ - `optim_args`: None
329
+ - `adafactor`: False
330
+ - `group_by_length`: False
331
+ - `length_column_name`: length
332
+ - `ddp_find_unused_parameters`: None
333
+ - `ddp_bucket_cap_mb`: None
334
+ - `ddp_broadcast_buffers`: False
335
+ - `dataloader_pin_memory`: True
336
+ - `dataloader_persistent_workers`: False
337
+ - `skip_memory_metrics`: True
338
+ - `use_legacy_prediction_loop`: False
339
+ - `push_to_hub`: False
340
+ - `resume_from_checkpoint`: None
341
+ - `hub_model_id`: None
342
+ - `hub_strategy`: every_save
343
+ - `hub_private_repo`: False
344
+ - `hub_always_push`: False
345
+ - `gradient_checkpointing`: False
346
+ - `gradient_checkpointing_kwargs`: None
347
+ - `include_inputs_for_metrics`: False
348
+ - `eval_do_concat_batches`: True
349
+ - `fp16_backend`: auto
350
+ - `push_to_hub_model_id`: None
351
+ - `push_to_hub_organization`: None
352
+ - `mp_parameters`:
353
+ - `auto_find_batch_size`: True
354
+ - `full_determinism`: False
355
+ - `torchdynamo`: None
356
+ - `ray_scope`: last
357
+ - `ddp_timeout`: 1800
358
+ - `torch_compile`: False
359
+ - `torch_compile_backend`: None
360
+ - `torch_compile_mode`: None
361
+ - `dispatch_batches`: None
362
+ - `split_batches`: None
363
+ - `include_tokens_per_second`: False
364
+ - `include_num_input_tokens_seen`: False
365
+ - `neftune_noise_alpha`: None
366
+ - `optim_target_modules`: None
367
+ - `batch_eval_metrics`: False
368
+ - `eval_on_start`: False
369
+ - `eval_use_gather_object`: False
370
+ - `batch_sampler`: no_duplicates
371
+ - `multi_dataset_batch_sampler`: proportional
372
+
373
+ </details>
374
+
375
+ ### Training Logs
376
+ | Epoch  | Step  | Training Loss | Validation Loss |
377
+ |:------:|:-----:|:-------------:|:------:|
378
+ | 0.2076 | 7000 | 0.015 | 0.0053 |
379
+ | 0.4152 | 14000 | 0.0059 | 0.0042 |
380
+ | 0.6228 | 21000 | 0.0041 | 0.0034 |
381
+ | 0.8303 | 28000 | 0.0038 | 0.0030 |
382
+ | 1.0379 | 35000 | 0.0028 | 0.0026 |
383
+ | 1.2455 | 42000 | 0.0023 | 0.0023 |
384
+ | 1.4531 | 49000 | 0.0011 | 0.0023 |
385
+ | 1.6607 | 56000 | 0.0008 | 0.0020 |
386
+ | 1.8683 | 63000 | 0.0007 | 0.0020 |
387
+
388
+
389
+ ### Framework Versions
390
+ - Python: 3.10.13
391
+ - Sentence Transformers: 3.0.1
392
+ - Transformers: 4.44.0
393
+ - PyTorch: 2.2.1
394
+ - Accelerate: 0.33.0
395
+ - Datasets: 2.21.0
396
+ - Tokenizers: 0.19.1
397
+
398
+ ## Citation
399
+
400
+ ### BibTeX
401
+
402
+ #### Sentence Transformers
403
+ ```bibtex
404
+ @inproceedings{reimers-2019-sentence-bert,
405
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
406
+ author = "Reimers, Nils and Gurevych, Iryna",
407
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
408
+ month = "11",
409
+ year = "2019",
410
+ publisher = "Association for Computational Linguistics",
411
+ url = "https://arxiv.org/abs/1908.10084",
412
+ }
413
+ ```
414
+
415
+ #### CachedMultipleNegativesRankingLoss
416
+ ```bibtex
417
+ @misc{gao2021scaling,
418
+ title={Scaling Deep Contrastive Learning Batch Size under Memory Limited Setup},
419
+ author={Luyu Gao and Yunyi Zhang and Jiawei Han and Jamie Callan},
420
+ year={2021},
421
+ eprint={2101.06983},
422
+ archivePrefix={arXiv},
423
+ primaryClass={cs.LG}
424
+ }
425
+ ```
426
+
427
+ <!--
428
+ ## Glossary
429
+
430
+ *Clearly define terms in order to be accessible across audiences.*
431
+ -->
432
+
433
+ <!--
434
+ ## Model Card Authors
435
+
436
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
437
+ -->
438
+
439
+ <!--
440
+ ## Model Card Contact
441
+
442
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
443
+ -->
config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "sentence-transformers/all-mpnet-base-v2",
3
+ "architectures": [
4
+ "MPNetModel"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 514,
16
+ "model_type": "mpnet",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 1,
20
+ "relative_attention_num_buckets": 32,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.44.0",
23
+ "vocab_size": 30527
24
+ }
config_sentence_transformers.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "__version__": {
3
+ "sentence_transformers": "3.0.1",
4
+ "transformers": "4.44.0",
5
+ "pytorch": "2.2.1"
6
+ },
7
+ "prompts": {},
8
+ "default_prompt_name": null,
9
+ "similarity_fn_name": null
10
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:350c045b0cc4a1fde351cb517ebbf9321d8f845c005f861dcdbfde1aa808e11f
3
+ size 437967672
modules.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ },
14
+ {
15
+ "idx": 2,
16
+ "name": "2",
17
+ "path": "2_Normalize",
18
+ "type": "sentence_transformers.models.Normalize"
19
+ }
20
+ ]
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab5451d0793fe3e5146400709c5531a801046623aca2878ee049539941012788
3
+ size 871331770
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b90d5e27a1f660fb1d1c2b5edab918da19f9529b58c2027fa695a861b03e1e38
3
+ size 14244
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73603bea8e276e4f4072b153ce72b677a332cff82200e98e51fd251791972529
3
+ size 1064
sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 384,
3
+ "do_lower_case": false
4
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "<mask>",
25
+ "lstrip": true,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "[UNK]",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": true,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "104": {
36
+ "content": "[UNK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "30526": {
44
+ "content": "<mask>",
45
+ "lstrip": true,
46
+ "normalized": false,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": true
50
+ }
51
+ },
52
+ "bos_token": "<s>",
53
+ "clean_up_tokenization_spaces": true,
54
+ "cls_token": "<s>",
55
+ "do_lower_case": true,
56
+ "eos_token": "</s>",
57
+ "mask_token": "<mask>",
58
+ "max_length": 128,
59
+ "model_max_length": 384,
60
+ "pad_to_multiple_of": null,
61
+ "pad_token": "<pad>",
62
+ "pad_token_type_id": 0,
63
+ "padding_side": "right",
64
+ "sep_token": "</s>",
65
+ "stride": 0,
66
+ "strip_accents": null,
67
+ "tokenize_chinese_chars": true,
68
+ "tokenizer_class": "MPNetTokenizer",
69
+ "truncation_side": "right",
70
+ "truncation_strategy": "longest_first",
71
+ "unk_token": "[UNK]"
72
+ }
trainer_state.json ADDED
@@ -0,0 +1,168 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 1.8682719966786276,
5
+ "eval_steps": 7000,
6
+ "global_step": 63000,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.2075857774087364,
13
+ "grad_norm": 6.259258952923119e-05,
14
+ "learning_rate": 9.958482297312883e-06,
15
+ "loss": 0.015,
16
+ "step": 7000
17
+ },
18
+ {
19
+ "epoch": 0.2075857774087364,
20
+ "eval_loss": 0.005288162734359503,
21
+ "eval_runtime": 299.0787,
22
+ "eval_samples_per_second": 225.496,
23
+ "eval_steps_per_second": 28.19,
24
+ "step": 7000
25
+ },
26
+ {
27
+ "epoch": 0.4151715548174728,
28
+ "grad_norm": 0.0349661149084568,
29
+ "learning_rate": 8.805542283803155e-06,
30
+ "loss": 0.0059,
31
+ "step": 14000
32
+ },
33
+ {
34
+ "epoch": 0.4151715548174728,
35
+ "eval_loss": 0.004213849548250437,
36
+ "eval_runtime": 305.6778,
37
+ "eval_samples_per_second": 220.628,
38
+ "eval_steps_per_second": 27.581,
39
+ "step": 14000
40
+ },
41
+ {
42
+ "epoch": 0.6227573322262092,
43
+ "grad_norm": 0.0007877133903093636,
44
+ "learning_rate": 7.652767023081867e-06,
45
+ "loss": 0.0041,
46
+ "step": 21000
47
+ },
48
+ {
49
+ "epoch": 0.6227573322262092,
50
+ "eval_loss": 0.0033566548954695463,
51
+ "eval_runtime": 304.5219,
52
+ "eval_samples_per_second": 221.465,
53
+ "eval_steps_per_second": 27.686,
54
+ "step": 21000
55
+ },
56
+ {
57
+ "epoch": 0.8303431096349456,
58
+ "grad_norm": 0.006591067183762789,
59
+ "learning_rate": 6.50015651514902e-06,
60
+ "loss": 0.0038,
61
+ "step": 28000
62
+ },
63
+ {
64
+ "epoch": 0.8303431096349456,
65
+ "eval_loss": 0.003017185255885124,
66
+ "eval_runtime": 310.7502,
67
+ "eval_samples_per_second": 217.026,
68
+ "eval_steps_per_second": 27.131,
69
+ "step": 28000
70
+ },
71
+ {
72
+ "epoch": 1.037928887043682,
73
+ "grad_norm": 6.050535012036562e-05,
74
+ "learning_rate": 5.3470517488508496e-06,
75
+ "loss": 0.0028,
76
+ "step": 35000
77
+ },
78
+ {
79
+ "epoch": 1.037928887043682,
80
+ "eval_loss": 0.00263745104894042,
81
+ "eval_runtime": 318.0582,
82
+ "eval_samples_per_second": 212.04,
83
+ "eval_steps_per_second": 26.508,
84
+ "step": 35000
85
+ },
86
+ {
87
+ "epoch": 1.2455146644524184,
88
+ "grad_norm": 0.0005422074464149773,
89
+ "learning_rate": 4.194276488129561e-06,
90
+ "loss": 0.0023,
91
+ "step": 42000
92
+ },
93
+ {
94
+ "epoch": 1.2455146644524184,
95
+ "eval_loss": 0.002334447344765067,
96
+ "eval_runtime": 308.969,
97
+ "eval_samples_per_second": 218.278,
98
+ "eval_steps_per_second": 27.288,
99
+ "step": 42000
100
+ },
101
+ {
102
+ "epoch": 1.4531004418611548,
103
+ "grad_norm": 4.648882895708084e-05,
104
+ "learning_rate": 3.041501227408274e-06,
105
+ "loss": 0.0011,
106
+ "step": 49000
107
+ },
108
+ {
109
+ "epoch": 1.4531004418611548,
110
+ "eval_loss": 0.0022575457114726305,
111
+ "eval_runtime": 293.5363,
112
+ "eval_samples_per_second": 229.753,
113
+ "eval_steps_per_second": 28.722,
114
+ "step": 49000
115
+ },
116
+ {
117
+ "epoch": 1.6606862192698912,
118
+ "grad_norm": 5.3200383263174444e-05,
119
+ "learning_rate": 1.8890554722638682e-06,
120
+ "loss": 0.0008,
121
+ "step": 56000
122
+ },
123
+ {
124
+ "epoch": 1.6606862192698912,
125
+ "eval_loss": 0.0020312555134296417,
126
+ "eval_runtime": 311.6551,
127
+ "eval_samples_per_second": 216.396,
128
+ "eval_steps_per_second": 27.052,
129
+ "step": 56000
130
+ },
131
+ {
132
+ "epoch": 1.8682719966786276,
133
+ "grad_norm": 7.308552449103445e-05,
134
+ "learning_rate": 7.359507059656985e-07,
135
+ "loss": 0.0007,
136
+ "step": 63000
137
+ },
138
+ {
139
+ "epoch": 1.8682719966786276,
140
+ "eval_loss": 0.00200638803653419,
141
+ "eval_runtime": 310.1684,
142
+ "eval_samples_per_second": 217.433,
143
+ "eval_steps_per_second": 27.182,
144
+ "step": 63000
145
+ }
146
+ ],
147
+ "logging_steps": 7000,
148
+ "max_steps": 67442,
149
+ "num_input_tokens_seen": 0,
150
+ "num_train_epochs": 2,
151
+ "save_steps": 7000,
152
+ "stateful_callbacks": {
153
+ "TrainerControl": {
154
+ "args": {
155
+ "should_epoch_stop": false,
156
+ "should_evaluate": false,
157
+ "should_log": false,
158
+ "should_save": true,
159
+ "should_training_stop": false
160
+ },
161
+ "attributes": {}
162
+ }
163
+ },
164
+ "total_flos": 0.0,
165
+ "train_batch_size": 8,
166
+ "trial_name": null,
167
+ "trial_params": null
168
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02125f25240f4429166e8393a541fdcc5432811b50b3a49497faf680e6e1edb8
3
+ size 5432
vocab.txt ADDED
The diff for this file is too large to render. See raw diff