Skip to content

Commit

Permalink
Signed-off-by: limengxuan <[email protected]>
Browse files (browse the repository at this point in the history)
update vgpu part of device-plugin
  • Loading branch information
archlitchi committed Apr 11, 2024
1 parent 4d51c23 commit 24caf8e
Show file tree
Hide file tree
Showing 5 changed files with 3 additions and 29 deletions.
4 changes: 2 additions & 2 deletions .github/workflows/main.yml
Original file line number | Diff line number | Diff line change
Expand Up @@ -3,9 +3,9 @@ on:
push:
tags:
- v[0-9]+.[0-9]+.[0-9]+
branches: [master,dev-vgpu-1219]
branches: [master]
pull_request:
branches: [master,dev-vgpu-1219]
branches: [master]

jobs:
build:
Expand Down
1 change: 0 additions & 1 deletion docker/amd64/Dockerfile.vgpu-ubuntu20.04
Original file line number | Diff line number | Diff line change
Expand Up @@ -39,6 +39,5 @@ ENV NVIDIA_DRIVER_CAPABILITIES=utility

COPY --from=build /go/src/volcano.sh/devices/volcano-vgpu-device-plugin /usr/bin/volcano-vgpu-device-plugin
RUN mkdir -p /k8s-vgpu/lib/nvidia
COPY --from=build /go/src/volcano.sh/devices/lib/* /k8s-vgpu/lib/nvidia/

ENTRYPOINT ["volcano-vgpu-device-plugin"]
1 change: 0 additions & 1 deletion lib/ld.so.preload

This file was deleted.

Binary file removed lib/libvgpu.so
Binary file not shown.
26 changes: 1 addition & 25 deletions pkg/plugin/vgpu/plugin.go
Original file line number | Diff line number | Diff line change
Expand Up @@ -26,7 +26,6 @@ import (
"strings"
"time"

"k8s.io/apimachinery/pkg/util/uuid"
"k8s.io/klog/v2"
"volcano.sh/k8s-device-plugin/pkg/lock"
"volcano.sh/k8s-device-plugin/pkg/plugin/vgpu/config"
Expand Down Expand Up @@ -310,7 +309,7 @@ func (m *NvidiaDevicePlugin) Allocate(ctx context.Context, reqs *pluginapi.Alloc
}

for idx := range reqs.ContainerRequests {
currentCtr, devreq, err := util.GetNextDeviceRequest(util.NvidiaGPUDevice, *current)
_, devreq, err := util.GetNextDeviceRequest(util.NvidiaGPUDevice, *current)
klog.Infoln("deviceAllocateFromAnnotation=", devreq)
if err != nil {
klog.Errorln("get device from annotation failed", err.Error())
Expand Down Expand Up @@ -342,29 +341,6 @@ func (m *NvidiaDevicePlugin) Allocate(ctx context.Context, reqs *pluginapi.Alloc
response.Envs["NVIDIA_VISIBLE_DEVICES"] = dev.UUID
}
}
response.Envs["CUDA_DEVICE_MEMORY_SHARED_CACHE"] = fmt.Sprintf("/tmp/vgpu/%v.cache", uuid.NewUUID())

cacheFileHostDirectory := "/tmp/vgpu/containers/" + string(current.UID) + "_" + currentCtr.Name
os.MkdirAll(cacheFileHostDirectory, 0777)
os.Chmod(cacheFileHostDirectory, 0777)
os.MkdirAll("/tmp/vgpulock", 0777)
os.Chmod("/tmp/vgpulock", 0777)
hostHookPath := os.Getenv("HOOK_PATH")
response.Mounts = append(response.Mounts,
&pluginapi.Mount{ContainerPath: "/usr/local/vgpu/libvgpu.so",
HostPath: hostHookPath + "/libvgpu.so",
ReadOnly: true},
&pluginapi.Mount{ContainerPath: "/etc/ld.so.preload",
HostPath: hostHookPath + "/ld.so.preload",
ReadOnly: true},
&pluginapi.Mount{ContainerPath: "/tmp/vgpu",
HostPath: cacheFileHostDirectory,
ReadOnly: false},
&pluginapi.Mount{ContainerPath: "/tmp/vgpulock",
HostPath: "/tmp/vgpulock",
ReadOnly: false},
)
responses.ContainerResponses = append(responses.ContainerResponses, &response)
}
klog.Infoln("Allocate Response", responses.ContainerResponses)
util.PodAllocationTrySuccess(nodename, current)
Expand Down

0 comments on commit 24caf8e

Please sign in to comment.