|
190 | 190 | "framework_version": "1.5.0",
|
191 | 191 | "py_version": "py3",
|
192 | 192 | },
|
193 |
| - "hosting_instance_type_variants": { |
194 |
| - "regional_aliases": { |
195 |
| - "us-west-2": { |
196 |
| - "gpu_image_uri": "763104351884.dkr.ecr.us-west-2.amazonaws.com/" |
197 |
| - "huggingface-pytorch-inference:1.13.1-transformers4.26.0-gpu-py39-cu117-ubuntu20.04", |
198 |
| - "cpu_image_uri": "867930986793.dkr.us-west-2.amazonaws.com/cpu-blah", |
199 |
| - "inf_model_package_arn": "us-west-2/blah/blah/blah/inf", |
200 |
| - "gpu_model_package_arn": "us-west-2/blah/blah/blah/gpu", |
201 |
| - } |
202 |
| - }, |
203 |
| - "variants": { |
204 |
| - "p2": { |
205 |
| - "regional_properties": { |
206 |
| - "image_uri": "$gpu_image_uri", |
207 |
| - "model_package_arn": "$gpu_model_package_arn", |
208 |
| - } |
209 |
| - }, |
210 |
| - "p3": { |
211 |
| - "regional_properties": { |
212 |
| - "image_uri": "$gpu_image_uri", |
213 |
| - "model_package_arn": "$gpu_model_package_arn", |
214 |
| - } |
215 |
| - }, |
216 |
| - "p4": { |
217 |
| - "regional_properties": { |
218 |
| - "image_uri": "$gpu_image_uri", |
219 |
| - "model_package_arn": "$gpu_model_package_arn", |
220 |
| - } |
221 |
| - }, |
222 |
| - "g4dn": { |
223 |
| - "regional_properties": { |
224 |
| - "image_uri": "$gpu_image_uri", |
225 |
| - "model_package_arn": "$gpu_model_package_arn", |
226 |
| - } |
227 |
| - }, |
228 |
| - "m2": {"regional_properties": {"image_uri": "$cpu_image_uri"}}, |
229 |
| - "c2": {"regional_properties": {"image_uri": "$cpu_image_uri"}}, |
230 |
| - "ml.g5.48xlarge": { |
231 |
| - "properties": {"environment_variables": {"TENSOR_PARALLEL_DEGREE": "8"}} |
232 |
| - }, |
233 |
| - "ml.g5.12xlarge": { |
234 |
| - "properties": {"environment_variables": {"TENSOR_PARALLEL_DEGREE": "4"}} |
235 |
| - }, |
236 |
| - "inf1": {"regional_properties": {"model_package_arn": "$inf_model_package_arn"}}, |
237 |
| - "inf2": {"regional_properties": {"model_package_arn": "$inf_model_package_arn"}}, |
238 |
| - }, |
239 |
| - }, |
240 |
| - "training_ecr_specs": { |
241 |
| - "framework": "pytorch", |
242 |
| - "framework_version": "1.5.0", |
243 |
| - "py_version": "py3", |
244 |
| - }, |
245 | 193 | "training_instance_type_variants": {
|
| 194 | + "regional_aliases": {}, |
246 | 195 | "variants": {
|
247 | 196 | "ml.p2.12xlarge": {
|
248 | 197 | "properties": {
|
|
305 | 254 | "scope": "algorithm",
|
306 | 255 | },
|
307 | 256 | ],
|
| 257 | + "metrics": [ |
| 258 | + { |
| 259 | + "Name": "huggingface-textgeneration:instance-typemetric-loss", |
| 260 | + "Regex": "'eval_loss': ([0-9]+\\.[0-9]+)", |
| 261 | + }, |
| 262 | + { |
| 263 | + "Name": "huggingface-textgeneration:eval-loss", |
| 264 | + "Regex": "'eval_loss': ([0-9]+\\.[0-9]+)", |
| 265 | + }, |
| 266 | + { |
| 267 | + "Name": "huggingface-textgeneration:train-loss", |
| 268 | + "Regex": "'instance type specific': ([0-9]+\\.[0-9]+)", |
| 269 | + }, |
| 270 | + { |
| 271 | + "Name": "huggingface-textgeneration:noneyourbusiness-loss", |
| 272 | + "Regex": "'loss-noyb instance specific': ([0-9]+\\.[0-9]+)", |
| 273 | + }, |
| 274 | + ], |
308 | 275 | }
|
309 | 276 | },
|
310 | 277 | "p2": {
|
| 278 | + "regional_properties": {"image_uri": "$gpu_ecr_uri_2"}, |
311 | 279 | "properties": {
|
312 | 280 | "hyperparameters": [
|
313 | 281 | {
|
|
372 | 340 | "default": "20",
|
373 | 341 | "scope": "container",
|
374 | 342 | },
|
375 |
| - ] |
| 343 | + ], |
| 344 | + "metrics": [ |
| 345 | + { |
| 346 | + "Name": "huggingface-textgeneration:wtafigo", |
| 347 | + "Regex": "'evasadfasdl_loss': ([0-9]+\\.[0-9]+)", |
| 348 | + }, |
| 349 | + { |
| 350 | + "Name": "huggingface-textgeneration:eval-loss", |
| 351 | + "Regex": "'eval_loss': ([0-9]+\\.[0-9]+)", |
| 352 | + }, |
| 353 | + { |
| 354 | + "Name": "huggingface-textgeneration:train-loss", |
| 355 | + "Regex": "'instance family specific': ([0-9]+\\.[0-9]+)", |
| 356 | + }, |
| 357 | + { |
| 358 | + "Name": "huggingface-textgeneration:noneyourbusiness-loss", |
| 359 | + "Regex": "'loss-noyb': ([0-9]+\\.[0-9]+)", |
| 360 | + }, |
| 361 | + ], |
| 362 | + }, |
| 363 | + }, |
| 364 | + }, |
| 365 | + }, |
| 366 | + "hosting_instance_type_variants": { |
| 367 | + "regional_aliases": { |
| 368 | + "us-west-2": { |
| 369 | + "gpu_image_uri": "763104351884.dkr.ecr.us-west-2.amazonaws.com/" |
| 370 | + "huggingface-pytorch-inference:1.13.1-transformers4.26.0-gpu-py39-cu117-ubuntu20.04", |
| 371 | + "cpu_image_uri": "867930986793.dkr.us-west-2.amazonaws.com/cpu-blah", |
| 372 | + "inf_model_package_arn": "us-west-2/blah/blah/blah/inf", |
| 373 | + "gpu_model_package_arn": "us-west-2/blah/blah/blah/gpu", |
| 374 | + } |
| 375 | + }, |
| 376 | + "variants": { |
| 377 | + "p2": { |
| 378 | + "regional_properties": { |
| 379 | + "image_uri": "$gpu_image_uri", |
| 380 | + "model_package_arn": "$gpu_model_package_arn", |
376 | 381 | }
|
377 | 382 | },
|
378 |
| - } |
| 383 | + "p3": { |
| 384 | + "regional_properties": { |
| 385 | + "image_uri": "$gpu_image_uri", |
| 386 | + "model_package_arn": "$gpu_model_package_arn", |
| 387 | + } |
| 388 | + }, |
| 389 | + "p4": { |
| 390 | + "regional_properties": { |
| 391 | + "image_uri": "$gpu_image_uri", |
| 392 | + "model_package_arn": "$gpu_model_package_arn", |
| 393 | + } |
| 394 | + }, |
| 395 | + "g4dn": { |
| 396 | + "regional_properties": { |
| 397 | + "image_uri": "$gpu_image_uri", |
| 398 | + "model_package_arn": "$gpu_model_package_arn", |
| 399 | + } |
| 400 | + }, |
| 401 | + "m2": {"regional_properties": {"image_uri": "$cpu_image_uri"}}, |
| 402 | + "c2": {"regional_properties": {"image_uri": "$cpu_image_uri"}}, |
| 403 | + "ml.g5.48xlarge": { |
| 404 | + "properties": {"environment_variables": {"TENSOR_PARALLEL_DEGREE": "8"}} |
| 405 | + }, |
| 406 | + "ml.g5.12xlarge": { |
| 407 | + "properties": {"environment_variables": {"TENSOR_PARALLEL_DEGREE": "4"}} |
| 408 | + }, |
| 409 | + "inf1": {"regional_properties": {"model_package_arn": "$inf_model_package_arn"}}, |
| 410 | + "inf2": {"regional_properties": {"model_package_arn": "$inf_model_package_arn"}}, |
| 411 | + }, |
| 412 | + }, |
| 413 | + "training_ecr_specs": { |
| 414 | + "framework": "pytorch", |
| 415 | + "framework_version": "1.5.0", |
| 416 | + "py_version": "py3", |
379 | 417 | },
|
380 | 418 | "hosting_artifact_key": "pytorch-infer/infer-pytorch-ic-mobilenet-v2.tar.gz",
|
381 | 419 | "training_artifact_key": "pytorch-training/train-pytorch-ic-mobilenet-v2.tar.gz",
|
|
515 | 553 | "ml.c5.2xlarge",
|
516 | 554 | ],
|
517 | 555 | "hosting_use_script_uri": True,
|
518 |
| - "metrics": [{"Regex": "val_accuracy: ([0-9\\.]+)", "Name": "pytorch-ic:val-accuracy"}], |
| 556 | + "metrics": [ |
| 557 | + { |
| 558 | + "Name": "huggingface-textgeneration:train-loss", |
| 559 | + "Regex": "'loss default': ([0-9]+\\.[0-9]+)", |
| 560 | + }, |
| 561 | + { |
| 562 | + "Name": "huggingface-textgeyyyuyuyuyneration:train-loss", |
| 563 | + "Regex": "'loss default': ([0-9]+\\.[0-9]+)", |
| 564 | + }, |
| 565 | + ], |
519 | 566 | "model_kwargs": {"some-model-kwarg-key": "some-model-kwarg-value"},
|
520 | 567 | "deploy_kwargs": {"some-model-deploy-kwarg-key": "some-model-deploy-kwarg-value"},
|
521 | 568 | "estimator_kwargs": {
|
|
0 commit comments