|
118 | 118 | "scope": "container",
|
119 | 119 | },
|
120 | 120 | ],
|
| 121 | + "default_inference_instance_type": "", |
| 122 | + "supported_inference_instance_types": None, |
| 123 | + "default_training_instance_type": None, |
| 124 | + "supported_training_instance_types": [], |
| 125 | + "inference_vulnerable": False, |
| 126 | + "inference_dependencies": [], |
| 127 | + "inference_vulnerabilities": [], |
| 128 | + "training_vulnerable": False, |
| 129 | + "training_dependencies": [], |
| 130 | + "training_vulnerabilities": [], |
| 131 | + "deprecated": False, |
| 132 | + "metrics": [], |
| 133 | + }, |
| 134 | + "huggingface-text2text-flan-t5-xxl-fp16": { |
| 135 | + "model_id": "huggingface-text2text-flan-t5-xxl-fp16", |
| 136 | + "url": "https://huggingface.co/google/flan-t5-xxl", |
| 137 | + "version": "1.0.0", |
| 138 | + "min_sdk_version": "2.130.0", |
| 139 | + "training_supported": False, |
| 140 | + "incremental_training_supported": False, |
| 141 | + "hosting_ecr_specs": { |
| 142 | + "framework": "pytorch", |
| 143 | + "framework_version": "1.12.0", |
| 144 | + "py_version": "py38", |
| 145 | + "huggingface_transformers_version": "4.17.0", |
| 146 | + }, |
| 147 | + "hosting_artifact_key": "huggingface-infer/infer-huggingface-text2text-flan-t5-xxl-fp16.tar.gz", |
| 148 | + "hosting_script_key": "source-directory-tarballs/huggingface/inference/text2text/v1.0.2/sourcedir.tar.gz", |
| 149 | + "hosting_prepacked_artifact_key": "huggingface-infer/prepack/v1.0.0/infer-prepack-huggingface-" |
| 150 | + "text2text-flan-t5-xxl-fp16.tar.gz", |
| 151 | + "hosting_prepacked_artifact_version": "1.0.0", |
| 152 | + "inference_vulnerable": False, |
| 153 | + "inference_dependencies": [ |
| 154 | + "accelerate==0.16.0", |
| 155 | + "bitsandbytes==0.37.0", |
| 156 | + "filelock==3.9.0", |
| 157 | + "huggingface-hub==0.12.0", |
| 158 | + "regex==2022.7.9", |
| 159 | + "tokenizers==0.13.2", |
| 160 | + "transformers==4.26.0", |
| 161 | + ], |
| 162 | + "inference_vulnerabilities": [], |
| 163 | + "training_vulnerable": False, |
| 164 | + "training_dependencies": [], |
| 165 | + "training_vulnerabilities": [], |
| 166 | + "deprecated": False, |
| 167 | + "inference_environment_variables": [ |
| 168 | + { |
| 169 | + "name": "SAGEMAKER_PROGRAM", |
| 170 | + "type": "text", |
| 171 | + "default": "inference.py", |
| 172 | + "scope": "container", |
| 173 | + }, |
| 174 | + { |
| 175 | + "name": "SAGEMAKER_SUBMIT_DIRECTORY", |
| 176 | + "type": "text", |
| 177 | + "default": "/opt/ml/model/code", |
| 178 | + "scope": "container", |
| 179 | + }, |
| 180 | + { |
| 181 | + "name": "SAGEMAKER_CONTAINER_LOG_LEVEL", |
| 182 | + "type": "text", |
| 183 | + "default": "20", |
| 184 | + "scope": "container", |
| 185 | + }, |
| 186 | + { |
| 187 | + "name": "MODEL_CACHE_ROOT", |
| 188 | + "type": "text", |
| 189 | + "default": "/opt/ml/model", |
| 190 | + "scope": "container", |
| 191 | + }, |
| 192 | + {"name": "SAGEMAKER_ENV", "type": "text", "default": "1", "scope": "container"}, |
| 193 | + { |
| 194 | + "name": "SAGEMAKER_MODEL_SERVER_WORKERS", |
| 195 | + "type": "text", |
| 196 | + "default": "1", |
| 197 | + "scope": "container", |
| 198 | + }, |
| 199 | + { |
| 200 | + "name": "SAGEMAKER_MODEL_SERVER_TIMEOUT", |
| 201 | + "type": "text", |
| 202 | + "default": "3600", |
| 203 | + "scope": "container", |
| 204 | + }, |
| 205 | + ], |
121 | 206 | "inference_vulnerable": False,
|
122 | 207 | "inference_dependencies": [],
|
123 | 208 | "inference_vulnerabilities": [],
|
124 | 209 | "training_vulnerable": False,
|
125 | 210 | "training_dependencies": [],
|
126 | 211 | "training_vulnerabilities": [],
|
127 | 212 | "deprecated": False,
|
128 |
| - "default_inference_instance_type": "", |
129 |
| - "supported_inference_instance_types": None, |
130 | 213 | "default_training_instance_type": None,
|
131 | 214 | "supported_training_instance_types": [],
|
132 |
| - } |
| 215 | + "metrics": [], |
| 216 | + "default_inference_instance_type": "ml.g5.12xlarge", |
| 217 | + "supported_inference_instance_types": [ |
| 218 | + "ml.g5.12xlarge", |
| 219 | + "ml.g5.24xlarge", |
| 220 | + "ml.p3.8xlarge", |
| 221 | + "ml.p3.16xlarge", |
| 222 | + "ml.g4dn.12xlarge", |
| 223 | + ], |
| 224 | + }, |
133 | 225 | }
|
134 | 226 |
|
135 | 227 |
|
|
1214 | 1306 | "training_artifact_key": "pytorch-training/train-pytorch-ic-mobilenet-v2.tar.gz",
|
1215 | 1307 | "hosting_script_key": "source-directory-tarballs/pytorch/inference/ic/v1.0.0/sourcedir.tar.gz",
|
1216 | 1308 | "training_script_key": "source-directory-tarballs/pytorch/transfer_learning/ic/v1.0.0/sourcedir.tar.gz",
|
| 1309 | + "hosting_prepacked_artifact_key": None, |
1217 | 1310 | "hyperparameters": [
|
1218 | 1311 | {
|
1219 | 1312 | "name": "epochs",
|
|
0 commit comments