From eb358e8f7ca23da76c582c01065235c179ba9877 Mon Sep 17 00:00:00 2001
From: Suvratpalt <142586261+Suvratpalt@users.noreply.github.com>
Date: Fri, 2 Feb 2024 22:03:11 +0530
Subject: [PATCH] HuggingFaceH4-starchat-beta

Add the HuggingFaceH4/starchat-beta system model asset: asset.yaml,
description.md, model.yaml and spec.yaml.
---
Review notes (text between "---" and the first "diff --git" is ignored by
`git am` / `git apply`):
  * spec.yaml: the first entry of inference_compute_allow_list had no trailing
    comma, so YAML folded it and the next line into the single scalar
    "STANDARD_DS4_V2 Standard_DS5_v2". The comma is now present.
  * spec.yaml: that entry is written as Standard_DS4_v2 to match the casing of
    every other SKU in the list.
  * spec.yaml: removed the space before ':' on the languages and license keys.
  * spec.yaml: the file now ends with a newline.
  * Hunk sizes are unchanged; the blob id on the spec.yaml "index" line was
    not recomputed.

 assets/models/system/starchat-beta/asset.yaml |  4 ++
 .../system/starchat-beta/description.md       | 62 +++++++++++++++++
 assets/models/system/starchat-beta/model.yaml |  8 +++
 assets/models/system/starchat-beta/spec.yaml  | 68 +++++++++++++++++++
 4 files changed, 142 insertions(+)
 create mode 100644 assets/models/system/starchat-beta/asset.yaml
 create mode 100644 assets/models/system/starchat-beta/description.md
 create mode 100644 assets/models/system/starchat-beta/model.yaml
 create mode 100644 assets/models/system/starchat-beta/spec.yaml

diff --git a/assets/models/system/starchat-beta/asset.yaml b/assets/models/system/starchat-beta/asset.yaml
new file mode 100644
index 0000000000..eef472df50
--- /dev/null
+++ b/assets/models/system/starchat-beta/asset.yaml
@@ -0,0 +1,4 @@
+extra_config: model.yaml
+spec: spec.yaml
+type: model
+categories: ["Foundation Models", "Text Generation"]
diff --git a/assets/models/system/starchat-beta/description.md b/assets/models/system/starchat-beta/description.md
new file mode 100644
index 0000000000..c298faa7db
--- /dev/null
+++ b/assets/models/system/starchat-beta/description.md
@@ -0,0 +1,62 @@
+# **Model Details**
+
+Name: HuggingFaceH4/starchat-beta
+StarChat is a series of language models designed as helpful coding assistants. StarChat-β, the second model in this series, is a fine-tuned version of StarCoderPlus. The fine-tuning utilizes an "uncensored" variant of the openassistant-guanaco dataset, enhancing performance on coding tasks. Note that this model may produce problematic outputs when prompted.
+
+Model Details:
+
+Model type: A 16B parameter GPT-like model fine-tuned on an "uncensored" variant of the openassistant-guanaco dataset.
+Language(s): Primarily English and supports 80+ programming languages.
+License: BigCode Open RAIL-M v1
+Finetuned from: bigcode/starcoderplus
+Model Sources:
+
+Intended Uses & Limitations:
+Intended for chat and coding assistance.
+Caution advised for potential problematic outputs.
+Bias and demographic skewing from GitHub community demographics.
+May produce syntactically valid but semantically incorrect code.
+Potential for generating false URLs that require careful inspection.
+Training and Evaluation:
+
+Trained on "uncensored" openassistant-guanaco dataset.
+Utilizes the ShareGPT filtering recipe behind the WizardLM.
+Hyperparameters, including learning rate, batch size, and others, specified for training.
+In summary, StarChat-β serves as a coding assistant, trained and fine-tuned for code-related tasks, offering capabilities in multiple programming languages. Users are cautioned about potential problematic outputs and advised to use the model responsibly for educational and research purposes.
+
+Repository: https://github.com/bigcode-project/starcoder
+Demo: https://huggingface.co/spaces/HuggingFaceH4/starchat-playground
+
+# **Inference samples**
+
+Inference type|Python sample (Notebook)|CLI with YAML
+|--|--|--|
+Real time|text-generation-online-endpoint.ipynb|text-generation-online-endpoint.sh
+Batch |text-generation-batch-endpoint.ipynb| coming soon
+
+
+# **Sample inputs and outputs**
+
+### **Sample input**
+```json
+{
+    "input_data":{
+        "input_string":["the meaning of life is"],
+        "parameters":{
+            "temperature":0.5,
+            "top_p":0.5,
+            "max_new_tokens":10,
+            "do_sample":true
+        }
+    }
+}
+```
+
+### **Sample output**
+```json
+[
+    {
+        "0": "the meaning of life is to find your gift. the purpose of life is"
+    }
+]
+```
diff --git a/assets/models/system/starchat-beta/model.yaml b/assets/models/system/starchat-beta/model.yaml
new file mode 100644
index 0000000000..86d54772c5
--- /dev/null
+++ b/assets/models/system/starchat-beta/model.yaml
@@ -0,0 +1,8 @@
+path:
+  container_name: models
+  container_path: huggingface/HuggingFaceH4-starchat-beta/1706255740/mlflow_model_folder
+  storage_name: automlcesdkdataresources
+  type: azureblob
+publish:
+  description: description.md
+  type: mlflow_model
diff --git a/assets/models/system/starchat-beta/spec.yaml b/assets/models/system/starchat-beta/spec.yaml
new file mode 100644
index 0000000000..99e1d933bc
--- /dev/null
+++ b/assets/models/system/starchat-beta/spec.yaml
@@ -0,0 +1,68 @@
+$schema: https://azuremlschemas.azureedge.net/latest/model.schema.json
+name: HuggingFaceH4-starchat-beta
+path: ./
+properties:
+  SharedComputeCapacityEnabled: true
+  SHA: b1bcda690655777373f57ea6614eb095ec2c886f
+  inference-min-sku-spec: 12|1|220|64
+  inference-recommended-sku: Standard_NC12s_v3, Standard_NC24s_v3, Standard_ND40rs_v2, Standard_NC24ads_A100_v4, Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4, Standard_ND96asr_v4
+  evaluation-min-sku-spec: 6|1|112|128
+  evaluation-recommended-sku: Standard_NC6s_v3, Standard_NC12s_v3, Standard_NC24s_v3, Standard_NC24rs_v3, Standard_ND40rs_v2, Standard_NC48ads_A100_v4, Standard_NC96ads_A100_v4, Standard_ND96amsr_A100_v4, Standard_ND96asr_v4
+  finetune-min-sku-spec: 40|8|672|2900
+  finetune-recommended-sku: Standard_ND40rs_v2, Standard_ND96amsr_A100_v4, Standard_ND96asr_v4
+  finetuning-tasks: text-generation
+  languages: en
+  license: bigcode-openrail-m
+
+tags:
+  Featured: ""
+  SharedComputeCapacityEnabled: ""
+  huggingface_model_id: HuggingFaceH4/starchat-beta
+  inference_compute_allow_list:
+    [
+      Standard_DS4_v2,
+      Standard_DS5_v2,
+      Standard_D16a_v4,
+      Standard_D16as_v4,
+      Standard_D32a_v4,
+      Standard_D32as_v4,
+      Standard_D48a_v4,
+      Standard_D48as_v4,
+      Standard_D64a_v4,
+      Standard_D64as_v4,
+      Standard_D96a_v4,
+      Standard_D96as_v4,
+      Standard_F4s_v2,
+      Standard_FX4mds,
+      Standard_F8s_v2,
+      Standard_FX12mds,
+      Standard_F16s_v2,
+      Standard_F32s_v2,
+      Standard_F48s_v2,
+      Standard_F64s_v2,
+      Standard_F72s_v2,
+      Standard_FX24mds,
+      Standard_FX36mds,
+      Standard_FX48mds,
+      Standard_E2s_v3,
+      Standard_E4s_v3,
+      Standard_E8s_v3,
+      Standard_E16s_v3,
+      Standard_E32s_v3,
+      Standard_E48s_v3,
+      Standard_E64s_v3,
+      Standard_NC4as_T4_v3,
+      Standard_NC6s_v3,
+      Standard_NC8as_T4_v3,
+      Standard_NC12s_v3,
+      Standard_NC16as_T4_v3,
+      Standard_NC24s_v3,
+      Standard_NC64as_T4_v3,
+      Standard_NC24ads_A100_v4,
+      Standard_NC48ads_A100_v4,
+      Standard_NC96ads_A100_v4,
+      Standard_ND96asr_v4,
+      Standard_ND96amsr_A100_v4,
+      Standard_ND40rs_v2,
+    ]
+version: 1