sagemaker-models / model.json
philschmid's picture
Update model.json with amazon/FalconLite instance recommendation (#1)
ff19e10
raw
history blame contribute delete
904 Bytes
{
"inference": {
"gpt2": {
"instanceType": "ml.g4dn.xlarge",
"numShard": 1
},
"google/flan-t5-xxl": {
"instanceType": "ml.g5.12xlarge",
"numShard": 4
},
"bigscience/bloom-7b1": {
"instanceType": "ml.g5.12xlarge",
"numShard": 4
},
"EleutherAI/gpt-neo-2.7B": {
"instanceType": "ml.g5.xlarge",
"numShard": 1
},
"tiiuae/falcon-40b-instruct": {
"instanceType": "ml.g5.12xlarge",
"numShard": 4
},
"EleutherAI/gpt-neox-20b": {
"instanceType": "ml.g5.12xlarge",
"numShard": 4
},
"bigcode/starcoder": {
"instanceType": "ml.g5.12xlarge",
"numShard": 4
},
"openlm-research/open_llama_13b": {
"instanceType": "ml.g5.12xlarge",
"numShard": 4
},
"amazon/FalconLite": {
"instanceType": "ml.g5.12xlarge",
"numShard": 4
}
},
"training":{}
}