From 62eb72db80a02fbbf82c08a781472898f3858783 Mon Sep 17 00:00:00 2001 From: Dillon Erb <585865+dte@users.noreply.github.com> Date: Mon, 30 Dec 2019 20:08:43 -0500 Subject: [PATCH 1/4] Update to GradientCI 2 --- .ps_project/config.yaml | 49 ++++++++++++++++------------------------- 1 file changed, 19 insertions(+), 30 deletions(-) diff --git a/.ps_project/config.yaml b/.ps_project/config.yaml index 4afda3c..bfb022c 100644 --- a/.ps_project/config.yaml +++ b/.ps_project/config.yaml @@ -1,30 +1,19 @@ -version: 1 -type: "multi-grpc" -ports: "5000" -filters: - tags: - only: 'v.*' - branches: - only: '.*' -parameter-server: - container: "tensorflow/tensorflow:1.13.1-py3" - command: "pip install -r requirements.txt && python mnist.py" - machine-type: "G1" - count: 1 -worker: - container: "tensorflow/tensorflow:1.13.1-gpu-py3" - command: "pip install -r requirements.txt && python mnist.py" - machine-type: "K80" - count: 2 -model: - type: Tensorflow - path: '/artifacts' -checks: - tensorflow:loss: - target: 0.0..1.0 - aggregate: max - tensorflow:accuracy: - target: 0.988..1.000 - aggregate: median - defaults: - precision: 3 +version: 2 + +workflows: + single-node: + steps: + - + name: "single-node" + command: experiment.run_multi_node + params: + workerCommand: nvidia-smi + workerMachineType: "K80" + workerWorkingDirectory: "/home/playground" + workerArtifactDirectory: "/artifacts" + workerContainer: tensorflow/tensorflow:1.13.1-gpu-py3 + parameterServerCommand: nvidia-smi + parameterServerMachineType: "K80" + parameterServerWorkingDirectory: "/home/playground" + parameterServerArtifactDirectory: "/artifacts" + parameterServerContainer: tensorflow/tensorflow:1.13.1-gpu-py3 From d360f0ad1821ca30bdeecb1fe2134ddc1c737043 Mon Sep 17 00:00:00 2001 From: Dillon Erb <585865+dte@users.noreply.github.com> Date: Mon, 30 Dec 2019 20:12:34 -0500 Subject: [PATCH 2/4] Update config.yaml --- .ps_project/config.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.ps_project/config.yaml b/.ps_project/config.yaml index bfb022c..b40793a 100644 --- a/.ps_project/config.yaml +++ b/.ps_project/config.yaml @@ -4,7 +4,7 @@ workflows: single-node: steps: - - name: "single-node" + name: "multi-node" command: experiment.run_multi_node params: workerCommand: nvidia-smi From d7edb7abca8c31ba968ec59d16c0d517f7719a34 Mon Sep 17 00:00:00 2001 From: Dillon Erb <585865+dte@users.noreply.github.com> Date: Thu, 2 Jan 2020 16:47:56 -0500 Subject: [PATCH 3/4] Update config.yaml --- .ps_project/config.yaml | 38 ++++++++++++++++++++++++++------------ 1 file changed, 26 insertions(+), 12 deletions(-) diff --git a/.ps_project/config.yaml b/.ps_project/config.yaml index b40793a..9f97614 100644 --- a/.ps_project/config.yaml +++ b/.ps_project/config.yaml @@ -1,19 +1,33 @@ version: 2 - workflows: - single-node: + ci-test: steps: - - name: "multi-node" + name: "my experiment" command: experiment.run_multi_node params: - workerCommand: nvidia-smi + ports: "5000" + modelPath: "/artifacts" + modelType: "Tensorflow" + workerCommand: "pip install -r requirements.txt && python mnist.py" + workerContainer: "tensorflow/tensorflow:1.13.1-gpu-py3" workerMachineType: "K80" - workerWorkingDirectory: "/home/playground" - workerArtifactDirectory: "/artifacts" - workerContainer: tensorflow/tensorflow:1.13.1-gpu-py3 - parameterServerCommand: nvidia-smi - parameterServerMachineType: "K80" - parameterServerWorkingDirectory: "/home/playground" - parameterServerArtifactDirectory: "/artifacts" - parameterServerContainer: tensorflow/tensorflow:1.13.1-gpu-py3 + workerCount: 2 + parameterServerCount: 1 + parameterServerCommand: "pip install -r requirements.txt && python mnist.py" + parameterServerContainer: "tensorflow/tensorflow:1.13.1-py3" + parameterServerMachineType: "G1" + checks: + tensorflow:loss: + target: 0.0..1.0 + aggregate: max + tensorflow:accuracy: + target: 0.988..1.000 + aggregate: median + defaults: + precision: 3 + triggers: + tags: + only: 'v.*' + branches: + only: '.*' From 443cde234e66bd63f75f142ef9a05bc6a33d998b Mon Sep 17 00:00:00 2001 From: Dillon Erb <585865+dte@users.noreply.github.com> Date: Mon, 13 Jan 2020 15:49:17 -0500 Subject: [PATCH 4/4] Update config.yaml