|
1 | 1 | {
|
2 |
| - "jobid": "84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
| 2 | + "jobid": "87ed37bc-a837-4f20-aad0-0a12754452f4", |
3 | 3 | "cmdline": {
|
4 |
| - "appPart": "python3 tmp-3113-RmwfLb44cTU3 -v -b ${S3_BUCKET} -m ${S3_OBJECTMODEL} -g ${S3_OBJECTGLUEDATA} -t WNLI -M -s 40 41 42 43", |
5 |
| - "systemPart": "ray job submit --runtime-env=/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp-3113-8BRkUtu0rNmo --job-id ${JOB_ID} --no-wait" |
| 4 | + "appPart": "python3 tmp-39715-vOKRmyNRUiZ6 -v -b ${S3_BUCKET} -m ${S3_OBJECTMODEL} -g ${S3_OBJECTGLUEDATA} -t WNLI -M -s 40 41 42 43", |
| 5 | + "systemPart": "ray job submit --runtime-env=/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp-39715-KyWwb7w9Tliq --job-id ${JOB_ID} --no-wait" |
6 | 6 | },
|
7 | 7 | "runtimeEnv": {
|
8 | 8 | "env_vars": {
|
9 |
| - "JOB_ID": "84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
| 9 | + "JOB_ID": "87ed37bc-a837-4f20-aad0-0a12754452f4", |
| 10 | + "S3_PROVIDER": "aws", |
10 | 11 | "S3_ENDPOINT": "https://s3.amazonaws.com",
|
11 | 12 | "S3_ACCESS_KEY_ID": "********",
|
12 | 13 | "AWS_ACCESS_KEY_ID": "********",
|
13 | 14 | "S3_SECRET_ACCESS_KEY": "********",
|
14 | 15 | "AWS_SECRET_ACCESS_KEY": "********",
|
15 |
| - "MC_CONFIG_DIR": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp.VAPQnMBX", |
| 16 | + "MC_CONFIG_DIR": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp.NOeQ5szv", |
16 | 17 | "S3_BUCKETRAYLOGS": "browsey",
|
17 | 18 | "S3_FILEPATHRAYLOGS": "RAYLOGS",
|
18 |
| - "S3_LOGDIR": "browsey/codeflare/84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
19 |
| - "LOGDIR_STAGE": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.Vqva5wI0", |
20 |
| - "LOGDIR_URI": "s3://browsey/codeflare/84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
21 |
| - "LOGDIR_MC": "s3/browsey/codeflare/84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
22 |
| - "STREAMCONSUMER_LOGS": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.Vqva5wI0/logs/", |
23 |
| - "STREAMCONSUMER_EVENTS": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.Vqva5wI0/events/", |
24 |
| - "STREAMCONSUMER_RESOURCES": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.Vqva5wI0/resources/", |
| 19 | + "S3_LOGDIR": "browsey/codeflare/87ed37bc-a837-4f20-aad0-0a12754452f4", |
| 20 | + "LOGDIR_STAGE": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.n2ngzgZg", |
| 21 | + "LOGDIR_URI": "s3://browsey/codeflare/87ed37bc-a837-4f20-aad0-0a12754452f4", |
| 22 | + "LOGDIR_MC": "s3/browsey/codeflare/87ed37bc-a837-4f20-aad0-0a12754452f4", |
| 23 | + "STREAMCONSUMER_LOGS": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.n2ngzgZg/logs/", |
| 24 | + "STREAMCONSUMER_EVENTS": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.n2ngzgZg/events/", |
| 25 | + "STREAMCONSUMER_RESOURCES": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.n2ngzgZg/resources/", |
25 | 26 | "KUBE_CONTEXT": "default/api-codeflare-train-v11-codeflare-openshift-com:6443/kube:admin",
|
26 | 27 | "KUBE_NS": "nvidia-gpu-operator",
|
27 | 28 | "NUM_CPUS": "1",
|
|
30 | 31 | "MAX_WORKERS": "1",
|
31 | 32 | "WORKER_MEMORY": "32Gi",
|
32 | 33 | "HEAD_MEMORY": "32Gi",
|
| 34 | + "RAY_OPERATOR_IMAGE": "rayproject/ray:1.13.0-py37", |
| 35 | + "RAY_IMAGE": "rayproject/ray-ml:1.13.0-py37-gpu", |
| 36 | + "HELM_CLONE_TEMPDIR": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp.VerQFNF6", |
33 | 37 | "RAY_KUBE_CLUSTER_NAME": "mycluster",
|
| 38 | + "KUBE_POD_LABEL_SELECTOR": "ray-user-node-type=rayWorkerType", |
| 39 | + "KUBE_PODFULL_LABEL_SELECTOR": "ray-node-type", |
34 | 40 | "RAY_KUBE_PORT": "8266",
|
35 | 41 | "RAY_ADDRESS": "http://127.0.0.1:8266",
|
36 |
| - "KUBE_POD_LABEL_SELECTOR": "ray-user-node-type=rayWorkerType", |
37 | 42 | "S3_BUCKET": "browsey",
|
38 | 43 | "S3_FILEPATH": "browsey",
|
39 | 44 | "S3_OBJECTMODEL": "roberta-base",
|
|
43 | 48 | "WANDB_CONFIG_DIR": "/tmp",
|
44 | 49 | "WANDB_DISABLED": "true"
|
45 | 50 | },
|
46 |
| - "working_dir": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp-3113-ma7eFXGAJZjS", |
| 51 | + "working_dir": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp-39715-QAaimTMZf5wC", |
47 | 52 | "pip": ["boto3", "ray[default]", "ray_lightning", "pytorch_lightning", "torchvision", "transformers==3.0.2"]
|
48 | 53 | },
|
49 | 54 | "language": "python",
|
|
0 commit comments