Skip to content

Commit

Permalink
chore(model): update llama model to predeploy model
Browse files Browse the repository at this point in the history
  • Loading branch information
tonywang10101 committed Oct 21, 2023
1 parent c1dc507 commit 8ba74c3
Show file tree
Hide file tree
Showing 2 changed files with 24 additions and 4 deletions.
16 changes: 13 additions & 3 deletions model-hub/model_hub_cpu.json
Original file line number Diff line number Diff line change
Expand Up @@ -5,8 +5,8 @@
"task": "TASK_CLASSIFICATION",
"model_definition": "model-definitions/github",
"configuration": {
"repository": "instill-ai/model-mobilenetv2-dvc",
"tag": "v1.0-cpu"
"repository": "instill-ai/model-mobilenetv2-dvc",
"tag": "v1.0-cpu"
}
},
{
Expand Down Expand Up @@ -77,5 +77,15 @@
"repository": "instill-ai/model-diffusion-dvc",
"tag": "v1.5-cpu"
}
},
{
"id": "llama2-7b",
"description": "Llama2-7b, from Meta, is trained to generate text based on your prompts.",
"task": "TASK_TEXT_GENERATION",
"model_definition": "model-definitions/github",
"configuration": {
"repository": "instill-ai/model-llama2-7b-dvc",
"tag": "fp32-7b-hf-tf-cpu"
}
}
]
]
12 changes: 11 additions & 1 deletion model-hub/model_hub_gpu.json
Original file line number Diff line number Diff line change
Expand Up @@ -78,5 +78,15 @@
"repository": "instill-ai/model-gpt2-megatron-dvc",
"tag": "fp32-345m-1-gpu"
}
},
{
"id": "llama2-7b",
"description": "Llama2-7b, from Meta, is trained to generate text based on your prompts.",
"task": "TASK_TEXT_GENERATION",
"model_definition": "model-definitions/github",
"configuration": {
"repository": "instill-ai/model-llama2-7b-dvc",
"tag": "fp16-7b-vllm-p80-1gpu"
}
}
]
]

0 comments on commit 8ba74c3

Please sign in to comment.