Skip to content

Commit

Permalink
Merge pull request #424 from grac3gao/update1127
Browse files Browse the repository at this point in the history
TCPXO new release
  • Loading branch information
grac3gao authored Dec 16, 2024
2 parents 1ddee13 + 4aeee0d commit 3140dbc
Show file tree
Hide file tree
Showing 4 changed files with 13 additions and 13 deletions.
2 changes: 1 addition & 1 deletion gpudirect-tcpxo/nccl-tcpxo-installer.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -69,7 +69,7 @@ spec:
chmod a+rw /dev/aperture_devices/*/resource*
fi
- name: nccl-tcpxo-installer
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.6
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.7
resources:
requests:
cpu: 150m
Expand Down
8 changes: 4 additions & 4 deletions gpudirect-tcpxo/nccl-test-latest.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -80,7 +80,7 @@ spec:
# dnsPolicy: ClusterFirstWithHostNet
containers:
- name: tcpxo-daemon
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.12
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.13_1
imagePullPolicy: Always
command: ["/bin/sh", "-c"]
args:
Expand All @@ -105,7 +105,7 @@ spec:
- name: LD_LIBRARY_PATH
value: /usr/local/nvidia/lib64
- name: nccl-test
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.6
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.7
imagePullPolicy: Always
# securityContext:
# privileged: true
Expand Down Expand Up @@ -210,7 +210,7 @@ spec:
# dnsPolicy: ClusterFirstWithHostNet
containers:
- name: tcpxo-daemon
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.12
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.13_1
imagePullPolicy: Always
command: ["/bin/sh", "-c"]
args:
Expand All @@ -235,7 +235,7 @@ spec:
- name: LD_LIBRARY_PATH
value: /usr/local/nvidia/lib64
- name: nccl-test
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.6
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.7
imagePullPolicy: Always
# securityContext:
# privileged: true
Expand Down
8 changes: 4 additions & 4 deletions [file path not captured]
Original file line number Diff line number Diff line change
Expand Up @@ -66,7 +66,7 @@ spec:
# dnsPolicy: ClusterFirstWithHostNet
containers:
- name: tcpxo-daemon
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.12
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.13_1
imagePullPolicy: Always
command: ["/bin/sh", "-c"]
args:
Expand All @@ -91,7 +91,7 @@ spec:
- name: LD_LIBRARY_PATH
value: /usr/local/nvidia/lib64
- name: nccl-test
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.6
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.7
imagePullPolicy: Always
# securityContext:
# privileged: true
Expand Down Expand Up @@ -196,7 +196,7 @@ spec:
# dnsPolicy: ClusterFirstWithHostNet
containers:
- name: tcpxo-daemon
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.12
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.13_1
imagePullPolicy: Always
command: ["/bin/sh", "-c"]
args:
Expand All @@ -221,7 +221,7 @@ spec:
- name: LD_LIBRARY_PATH
value: /usr/local/nvidia/lib64
- name: nccl-test
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.6
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.7
imagePullPolicy: Always
# securityContext:
# privileged: true
Expand Down
8 changes: 4 additions & 4 deletions gpudirect-tcpxo/nccl-test.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -41,7 +41,7 @@ spec:
dnsPolicy: ClusterFirstWithHostNet
containers:
- name: tcpxo-daemon
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.12
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.13_1
imagePullPolicy: Always
command: ["/bin/sh", "-c"]
args:
Expand All @@ -58,7 +58,7 @@ spec:
- name: LD_LIBRARY_PATH
value: /usr/local/nvidia/lib64
- name: nccl-test
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.6
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.7
imagePullPolicy: Always
command:
- /bin/sh
Expand Down Expand Up @@ -122,7 +122,7 @@ spec:
dnsPolicy: ClusterFirstWithHostNet
containers:
- name: tcpxo-daemon
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.12
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/tcpgpudmarxd-dev:v1.0.13_1
imagePullPolicy: Always
command: ["/bin/sh", "-c"]
args:
Expand All @@ -139,7 +139,7 @@ spec:
- name: LD_LIBRARY_PATH
value: /usr/local/nvidia/lib64
- name: nccl-test
-image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.6
+image: us-docker.pkg.dev/gce-ai-infra/gpudirect-tcpxo/nccl-plugin-gpudirecttcpx-dev:v1.0.7
imagePullPolicy: Always
command:
- /bin/sh
Expand Down

0 comments on commit 3140dbc

Please sign in to comment.