Skip to content

Commit 6f852fd

Browse files
author
Artem Yushkovskiy
authored
Try to fix Apex not working on all presets (#127)
1 parent 0e959e8 commit 6f852fd

File tree

2 files changed

+22
-2
lines changed

2 files changed

+22
-2
lines changed

Makefile

+18-2
Original file line number | Diff line number | Diff line change
@@ -32,6 +32,11 @@ image_pip_list:
32 32
e2e_neuro_push:
33 33
neuro push $(IMAGE_NAME):built $(TEST_IMAGE)
34 34

35+
36+
.PHONY: test_e2e
37+
test_e2e: test_e2e_pytorch test_e2e_tensorflow test_e2e_apex_gpu_small test_e2e_apex_gpu_large test_e2e_dependencies
38+
@echo "e2e tests succeeded!"
39+
35 40
TEST_PRESET=cpu-small
36 41
TEST_CMD=
37 42
.PHONY: _test_e2e
@@ -46,14 +51,25 @@ _test_e2e:
46 51

47 52
.PHONY: test_e2e_pytorch
48 53
test_e2e_pytorch: TEST_CMD=python /var/storage/gpu_pytorch.py
49-
test_e2e_pytorch: TEST_PRESET=gpu-small
54+
test_e2e_pytorch: TEST_PRESET=gpu-small-p
50 55
test_e2e_pytorch: _test_e2e
51 56

52 57
.PHONY: test_e2e_tensorflow
53 58
test_e2e_tensorflow: TEST_CMD=python /var/storage/gpu_tensorflow.py
54-
test_e2e_tensorflow: TEST_PRESET=gpu-small
59+
test_e2e_tensorflow: TEST_PRESET=gpu-small-p
55 60
test_e2e_tensorflow: _test_e2e
56 61

62+
.PHONY: test_e2e_apex_gpu_small
63+
test_e2e_apex_gpu_small: TEST_CMD=python /var/storage/gpu_apex.py
64+
test_e2e_apex_gpu_small: TEST_PRESET=gpu-small-p
65+
test_e2e_apex_gpu_small: _test_e2e
66+
test_e2e_tensorflow: _test_e2e
67+
68+
.PHONY: test_e2e_apex_gpu_large
69+
test_e2e_apex_gpu_large: TEST_CMD=python /var/storage/gpu_apex.py
70+
test_e2e_apex_gpu_large: TEST_PRESET=gpu-large-p
71+
test_e2e_apex_gpu_large: _test_e2e
72+
57 73
.PHONY: test_e2e_dependencies
58 74
test_e2e_dependencies: TEST_CMD=bash /var/storage/dependencies.sh
59 75
test_e2e_dependencies: _test_e2e

targets/python37-jupyter-pytorch-tensorflow-jupyterlab/Dockerfile

+4
Original file line number | Diff line number | Diff line change
@@ -171,6 +171,10 @@ RUN APT_INSTALL="apt-get install -y --no-install-recommends" && \
171 171
# Apex for PyTorch mixed precision training
172 172
# ==================================================================
173 173

174+
# problem: https://github.com/neuro-inc/ml-kinect-pose-estimation/issues/59
175+
# solution: https://github.com/NVIDIA/apex/issues/842
176+
ENV TORCH_CUDA_ARCH_LIST 6.0;7.0
177+
174 178
# Somehow Apex does not use releases, and current master fails to build
175 179
# (commit 1f2aa9156547377a023932a1512752c392d9bbdf on Apr 23, 2020).
176 180
# So we fix installation to the version Apr 21, 2020

0 commit comments

Comments
 (0)