|
1 | 1 | { |
2 | | - "jobid": "84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
| 2 | + "jobid": "87ed37bc-a837-4f20-aad0-0a12754452f4", |
3 | 3 | "cmdline": { |
4 | | - "appPart": "python3 tmp-3113-RmwfLb44cTU3 -v -b ${S3_BUCKET} -m ${S3_OBJECTMODEL} -g ${S3_OBJECTGLUEDATA} -t WNLI -M -s 40 41 42 43", |
5 | | - "systemPart": "ray job submit --runtime-env=/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp-3113-8BRkUtu0rNmo --job-id ${JOB_ID} --no-wait" |
| 4 | + "appPart": "python3 tmp-39715-vOKRmyNRUiZ6 -v -b ${S3_BUCKET} -m ${S3_OBJECTMODEL} -g ${S3_OBJECTGLUEDATA} -t WNLI -M -s 40 41 42 43", |
| 5 | + "systemPart": "ray job submit --runtime-env=/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp-39715-KyWwb7w9Tliq --job-id ${JOB_ID} --no-wait" |
6 | 6 | }, |
7 | 7 | "runtimeEnv": { |
8 | 8 | "env_vars": { |
9 | | - "JOB_ID": "84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
| 9 | + "JOB_ID": "87ed37bc-a837-4f20-aad0-0a12754452f4", |
| 10 | + "S3_PROVIDER": "aws", |
10 | 11 | "S3_ENDPOINT": "https://s3.amazonaws.com", |
11 | 12 | "S3_ACCESS_KEY_ID": "********", |
12 | 13 | "AWS_ACCESS_KEY_ID": "********", |
13 | 14 | "S3_SECRET_ACCESS_KEY": "********", |
14 | 15 | "AWS_SECRET_ACCESS_KEY": "********", |
15 | | - "MC_CONFIG_DIR": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp.VAPQnMBX", |
| 16 | + "MC_CONFIG_DIR": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp.NOeQ5szv", |
16 | 17 | "S3_BUCKETRAYLOGS": "browsey", |
17 | 18 | "S3_FILEPATHRAYLOGS": "RAYLOGS", |
18 | | - "S3_LOGDIR": "browsey/codeflare/84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
19 | | - "LOGDIR_STAGE": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.Vqva5wI0", |
20 | | - "LOGDIR_URI": "s3://browsey/codeflare/84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
21 | | - "LOGDIR_MC": "s3/browsey/codeflare/84d94981-8197-4bfd-a0a3-a93dd67dc2b7", |
22 | | - "STREAMCONSUMER_LOGS": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.Vqva5wI0/logs/", |
23 | | - "STREAMCONSUMER_EVENTS": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.Vqva5wI0/events/", |
24 | | - "STREAMCONSUMER_RESOURCES": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.Vqva5wI0/resources/", |
| 19 | + "S3_LOGDIR": "browsey/codeflare/87ed37bc-a837-4f20-aad0-0a12754452f4", |
| 20 | + "LOGDIR_STAGE": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.n2ngzgZg", |
| 21 | + "LOGDIR_URI": "s3://browsey/codeflare/87ed37bc-a837-4f20-aad0-0a12754452f4", |
| 22 | + "LOGDIR_MC": "s3/browsey/codeflare/87ed37bc-a837-4f20-aad0-0a12754452f4", |
| 23 | + "STREAMCONSUMER_LOGS": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.n2ngzgZg/logs/", |
| 24 | + "STREAMCONSUMER_EVENTS": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.n2ngzgZg/events/", |
| 25 | + "STREAMCONSUMER_RESOURCES": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/logdir-stage.n2ngzgZg/resources/", |
25 | 26 | "KUBE_CONTEXT": "default/api-codeflare-train-v11-codeflare-openshift-com:6443/kube:admin", |
26 | 27 | "KUBE_NS": "nvidia-gpu-operator", |
27 | 28 | "NUM_CPUS": "1", |
|
30 | 31 | "MAX_WORKERS": "1", |
31 | 32 | "WORKER_MEMORY": "32Gi", |
32 | 33 | "HEAD_MEMORY": "32Gi", |
| 34 | + "RAY_OPERATOR_IMAGE": "rayproject/ray:1.13.0-py37", |
| 35 | + "RAY_IMAGE": "rayproject/ray-ml:1.13.0-py37-gpu", |
| 36 | + "HELM_CLONE_TEMPDIR": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp.VerQFNF6", |
33 | 37 | "RAY_KUBE_CLUSTER_NAME": "mycluster", |
| 38 | + "KUBE_POD_LABEL_SELECTOR": "ray-user-node-type=rayWorkerType", |
| 39 | + "KUBE_PODFULL_LABEL_SELECTOR": "ray-node-type", |
34 | 40 | "RAY_KUBE_PORT": "8266", |
35 | 41 | "RAY_ADDRESS": "http://127.0.0.1:8266", |
36 | | - "KUBE_POD_LABEL_SELECTOR": "ray-user-node-type=rayWorkerType", |
37 | 42 | "S3_BUCKET": "browsey", |
38 | 43 | "S3_FILEPATH": "browsey", |
39 | 44 | "S3_OBJECTMODEL": "roberta-base", |
|
43 | 48 | "WANDB_CONFIG_DIR": "/tmp", |
44 | 49 | "WANDB_DISABLED": "true" |
45 | 50 | }, |
46 | | - "working_dir": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp-3113-ma7eFXGAJZjS", |
| 51 | + "working_dir": "/var/folders/2k/7mgd1tq55gdbghf0xkl2t_l80000gp/T/tmp-39715-QAaimTMZf5wC", |
47 | 52 | "pip": ["boto3", "ray[default]", "ray_lightning", "pytorch_lightning", "torchvision", "transformers==3.0.2"] |
48 | 53 | }, |
49 | 54 | "language": "python", |
|
0 commit comments