==== inspect 4437513a0a7d [ { "Id": "4437513a0a7db8fa2df52b9f8ab888d1d4684d53cd47ecc60884f3132fd6e20f", "Created": "2025-09-16T03:25:53.878986996Z", "Path": "/opt/nvidia/nvidia_entrypoint.sh", "Args": [ "/usr/sbin/sshd", "-D", "-p", "60023" ], "State": { "Status": "running", "Running": true, "Paused": false, "Restarting": false, "OOMKilled": false, "Dead": false, "Pid": 743280, "ExitCode": 0, "Error": "", "StartedAt": "2025-09-16T03:25:54.545313855Z", "FinishedAt": "0001-01-01T00:00:00Z" }, "Image": "sha256:70d86cd3508242f1eb743722ff7b8917e7a8e7ff2dc9a215ea44530cad69c2b8", "ResolvConfPath": "/var/lib/docker/containers/4437513a0a7db8fa2df52b9f8ab888d1d4684d53cd47ecc60884f3132fd6e20f/resolv.conf", "HostnamePath": "/var/lib/docker/containers/4437513a0a7db8fa2df52b9f8ab888d1d4684d53cd47ecc60884f3132fd6e20f/hostname", "HostsPath": "/var/lib/docker/containers/4437513a0a7db8fa2df52b9f8ab888d1d4684d53cd47ecc60884f3132fd6e20f/hosts", "LogPath": "/var/lib/docker/containers/4437513a0a7db8fa2df52b9f8ab888d1d4684d53cd47ecc60884f3132fd6e20f/4437513a0a7db8fa2df52b9f8ab888d1d4684d53cd47ecc60884f3132fd6e20f-json.log", "Name": "/nccl-test", "RestartCount": 0, "Driver": "overlay2", "Platform": "linux", "MountLabel": "", "ProcessLabel": "", "AppArmorProfile": "unconfined", "ExecIDs": null, "HostConfig": { "Binds": [ "/public/devops:/devops", "/data:/data" ], "ContainerIDFile": "", "LogConfig": { "Type": "json-file", "Config": {} }, "NetworkMode": "host", "PortBindings": {}, "RestartPolicy": { "Name": "always", "MaximumRetryCount": 0 }, "AutoRemove": false, "VolumeDriver": "", "VolumesFrom": null, "ConsoleSize": [ 0, 0 ], "CapAdd": null, "CapDrop": null, "CgroupnsMode": "private", "Dns": [], "DnsOptions": [], "DnsSearch": [], "ExtraHosts": null, "GroupAdd": null, "IpcMode": "host", "Cgroup": "", "Links": null, "OomScoreAdj": 0, "PidMode": "", "Privileged": true, "PublishAllPorts": false, "ReadonlyRootfs": false, "SecurityOpt": [ "label=disable" ], "UTSMode": "", "UsernsMode": "", "ShmSize": 549755813888, "Runtime": "runc", "Isolation": "", "CpuShares": 0, "Memory": 0, "NanoCpus": 0, "CgroupParent": "", "BlkioWeight": 0, "BlkioWeightDevice": [], "BlkioDeviceReadBps": [], "BlkioDeviceWriteBps": [], "BlkioDeviceReadIOps": [], "BlkioDeviceWriteIOps": [], "CpuPeriod": 0, "CpuQuota": 0, "CpuRealtimePeriod": 0, "CpuRealtimeRuntime": 0, "CpusetCpus": "", "CpusetMems": "", "Devices": [ { "PathOnHost": "/dev/infiniband", "PathInContainer": "/dev/infiniband", "CgroupPermissions": "rwm" } ], "DeviceCgroupRules": null, "DeviceRequests": [ { "Driver": "", "Count": -1, "DeviceIDs": null, "Capabilities": [ [ "gpu" ] ], "Options": {} } ], "MemoryReservation": 0, "MemorySwap": 0, "MemorySwappiness": null, "OomKillDisable": null, "PidsLimit": null, "Ulimits": [ { "Name": "memlock", "Hard": -1, "Soft": -1 } ], "CpuCount": 0, "CpuPercent": 0, "IOMaximumIOps": 0, "IOMaximumBandwidth": 0, "MaskedPaths": null, "ReadonlyPaths": null }, "GraphDriver": { "Data": { "LowerDir": "/var/lib/docker/overlay2/f86fbf0f96243c4b9ca7869879e5dd4f2ffd11fd9fccf005965a9b43ae7acdfa-init/diff:/var/lib/docker/overlay2/e606cbdc8fbf731e241e1848c9bcf050a86fcd66d4ba1c960beaff5ea0b51d21/diff:/var/lib/docker/overlay2/4cefcb3a5435947ad5ca474160699def4dbcc74210421dc2e2f1fe39f5ec20b1/diff:/var/lib/docker/overlay2/885731c4400b72652eb1d4945f28ae72d849f7e2552b8bd0a9074812906d39fa/diff:/var/lib/docker/overlay2/f9bc2dd3ae1ad5bfd001fed32b4a7e352b152e4fd2571bbfd7b03a6e2e3ad92d/diff:/var/lib/docker/overlay2/12ee4e26ace61b2751c3ebbfbd410b8b6f47bcca0940368acbbf70aba3ae7e43/diff:/var/lib/docker/overlay2/d3a6c9faa387fcbea143116c7283b86ecbc8334a882f4e80539fdf52129db25a/diff:/var/lib/docker/overlay2/6f428eb8f5d9659978fe0872936b1ea30d3230e62cb96c725726faa5b29bf204/diff:/var/lib/docker/overlay2/ea116100ce6c8f8b6fb115e9340264b6a9a2f7b18a41a5f10fc54cdf691c7c12/diff:/var/lib/docker/overlay2/ebf55f4625cb5724c3aca6635f2e2aa7c193b2a33cfb4df1a7ac19aeba8b226b/diff:/var/lib/docker/overlay2/56b7cc043eb085c0f2b5ed0bd29ba71c0ff7ad9a467ea8922e54f7126f4e1b78/diff:/var/lib/docker/overlay2/57b50509cb5c63293bebd3cdf971e43f4d97ea11bc662055f64f7c528397c59d/diff:/var/lib/docker/overlay2/82b9295b67726f908fa9745bdf72c788f1562d0cf979b62dbd3f54b947fc5fff/diff:/var/lib/docker/overlay2/f8e8ac55249125af25961c3853ed5f1990f628a67bab4a1e05d7c059aeec9599/diff:/var/lib/docker/overlay2/257495456fc24b866c1772e11b35d72ef8f87a5dc190d1fb12969c49af5eda33/diff:/var/lib/docker/overlay2/49b2f89be0b9fdc2e9eba76b9b20b836d40a79cf09f0d7b2c1321ee3481b0ce3/diff:/var/lib/docker/overlay2/e619f8a72f8e03275e6c3c18583b3a5f1d5ff09d15828d821478acec3f08f889/diff:/var/lib/docker/overlay2/caed4dac8802718d6e666f69010da0c72887042f43868cc9926ae74637757ed5/diff:/var/lib/docker/overlay2/18dd9b9ec24a477c98f1f4ae7bddd2818bc4e89713da5daec7832d1eba442327/diff:/var/lib/docker/overlay2/0c6de675d6f4ee17cf3ab5f293e9096f42514961f5cab35027159ae26dd5e4d1/diff:/var/lib/docker/overlay2/b8c42196d22871c573536a035d5ff1f71f7a892c63cee334065e7a199d6c343c/diff:/var/lib/docker/overlay2/96639d5ba7974706d6f341300b3987b7a8cf7ed1b639c64954a9e0172d6408e6/diff:/var/lib/docker/overlay2/47cb3df31f6b524ae852002243c3fee74c56bf77de022ac0a62e9197c71db6f8/diff:/var/lib/docker/overlay2/4313ff1ff783c606b409b9a7a9399d71d6df27846fc5010cd1fe972b44f9269b/diff:/var/lib/docker/overlay2/2c6e05c9909484676d6f3015a0fa7147c34d2df354179fbc02048e29ecd3f537/diff:/var/lib/docker/overlay2/e642ad0310f73a70d12633197cdbabf58932e2026e2ed85925345d595b98dd81/diff:/var/lib/docker/overlay2/70915c1320b739faf6b59d2a10906799d6b80fb184bc5c9f9c54cb0401f6241a/diff:/var/lib/docker/overlay2/ddc6c0796bfbf44e1b798d1c9e6d7995b4e7fa35a07e79104b6f92d8e249f63f/diff:/var/lib/docker/overlay2/8c59089eddd1a63a67363a0ea114eae7e744fd2de9ecb77758b275409e81f07d/diff:/var/lib/docker/overlay2/ce37b396a75e2fa5776eed0d5c872f5585994bd65dc884005a88fd8b2a3b2de4/diff:/var/lib/docker/overlay2/d8775c66baa813e91ca7e44847aafd75f3c02462ccf4567ddb6ed18dc41f0c53/diff:/var/lib/docker/overlay2/cb0eb3ebf7c380868b9a0b98ffa9ebaa601884d5b7ef4c1524e27a2f5d5eb91e/diff:/var/lib/docker/overlay2/5c3cc39c39a88c51d0db82d320f18fcb756fa2e0df1572704c63a46bef5e672a/diff:/var/lib/docker/overlay2/afcd8012015c297dde232de0de0d2ab9fa7be1901c26945c6b49f19b3ba1587c/diff:/var/lib/docker/overlay2/ecb854377bb3329a12def32a528a790bc498e8ba495babc34760f0eddfc009d5/diff:/var/lib/docker/overlay2/41d33d3a78edd2c1d5176ad1fbcaed3972b0cf8ed56d3c1e2eee41a828463446/diff:/var/lib/docker/overlay2/4371cecd2bb08c3cc326d3b435b2033079f84c5ebe1eebf270ae5f3515ff09ad/diff:/var/lib/docker/overlay2/a2b96400d27cfad4a4da2d5ae858fca2a889f689379bc7b45de39d9ea01d99b7/diff:/var/lib/docker/overlay2/95c5074bf4d5c24d3fea90c7e19182ecb087aee4f24a5a2dc711ccac94b36cde/diff:/var/lib/docker/overlay2/78aeb85e64f46b08c2c8a9093e04dfe572a5b476a4843f6ffc5f6b74472e8b2a/diff:/var/lib/docker/overlay2/89f84e7d191e64b7eb2e153fd8ff38c43b5e54c9fb59632a8e76d0aa6e204ed9/diff:/var/lib/docker/overlay2/b48abbe0de4e3149ca513ff3bf30d3fab46e4b079caae41816827a2b81d09ffc/diff:/var/lib/docker/overlay2/ae6486b81aa6d8ad9cfcdea232f2ec7bbb8a5db16b1c0aec3f490cb8ed144a46/diff:/var/lib/docker/overlay2/cffb5ce50181eb87e657dca0e8da767e5443331585c595e3ed163c308166af48/diff:/var/lib/docker/overlay2/c340f36011e12a57f3e23d4c6bc84f2dcab369b848cea122db44a2baea527f09/diff:/var/lib/docker/overlay2/ab31f560fc38b550ad4a0232b21d16e082a08186edea098332473339c51f3945/diff:/var/lib/docker/overlay2/ab15529f90b071aab0364ee9d0b2b91b18ba87cfb000aa27048804a2aaab299e/diff:/var/lib/docker/overlay2/f0a4661be96d456b32dd3377693a685c8d392de5f24f845806bd0099b830a053/diff:/var/lib/docker/overlay2/0dc199b8c0a1b56c5888b9415d91b8cf57c01728ad6e9d2984eadea42468155c/diff:/var/lib/docker/overlay2/08e6283f7dc926b616fefcd734d2f45500bb30783682689b8346b70c4247150b/diff:/var/lib/docker/overlay2/c8e88107d467612266259affbaea1269eb6d23e207fd58f46d58e873f1f0ab2c/diff:/var/lib/docker/overlay2/8a6c55b1d0292417f4c05a893c3c97174ca90a1e31f6663b1a7002955abc6442/diff:/var/lib/docker/overlay2/64a1d848d3540fa3bb3a7ec87b7cbe3829a7e8ab16529359e15a17887e211d08/diff:/var/lib/docker/overlay2/ba99098ccb01c727ba14696809fffda193627150597f9da1f35efc8553e849f4/diff:/var/lib/docker/overlay2/efb918ead7faf2f76fdb892d67710400e0a9dcd3152d351fec14382983d89f74/diff:/var/lib/docker/overlay2/b3a147bc5f3f02e4b8bae9098fb119cd24eea6cd771725916df0c4ea0458be38/diff:/var/lib/docker/overlay2/de3c6bb3d96e8e079618fb21c42126a294f4e6d818e0ff247a5f0431af4ca1be/diff:/var/lib/docker/overlay2/e18cf8be2355d1f8e63fe801b7816973d8c6131aee34ae34502f6ec16c14bbaf/diff:/var/lib/docker/overlay2/f6584dca58e98258b123ce209c4e66d520a240910fd46054ea91b5c007ad0dd0/diff:/var/lib/docker/overlay2/1c221cad4988ebeb921c400706426b948cffb704a1d03381ffe5f1561b42df75/diff:/var/lib/docker/overlay2/14711fefb3b17e33c34d584915c2b0d669b8b8800bc709d8665da10b13b2cc87/diff:/var/lib/docker/overlay2/791c0c8da0ce89310b49d06adf980faddbc116274710f857b1507e1d995ec661/diff:/var/lib/docker/overlay2/7997fe0441f4cdb20e7768b69d963528a1c076600126d393e026f9b87eb3ffd3/diff", "MergedDir": "/var/lib/docker/overlay2/f86fbf0f96243c4b9ca7869879e5dd4f2ffd11fd9fccf005965a9b43ae7acdfa/merged", "UpperDir": "/var/lib/docker/overlay2/f86fbf0f96243c4b9ca7869879e5dd4f2ffd11fd9fccf005965a9b43ae7acdfa/diff", "WorkDir": "/var/lib/docker/overlay2/f86fbf0f96243c4b9ca7869879e5dd4f2ffd11fd9fccf005965a9b43ae7acdfa/work" }, "Name": "overlay2" }, "Mounts": [ { "Type": "bind", "Source": "/data", "Destination": "/data", "Mode": "", "RW": true, "Propagation": "rprivate" }, { "Type": "bind", "Source": "/public/devops", "Destination": "/devops", "Mode": "", "RW": true, "Propagation": "rprivate" } ], "Config": { "Hostname": "p-jn-sz-dell-h1-su3-gpu02-402-11e-02u-208-64", "Domainname": "", "User": "", "AttachStdin": false, "AttachStdout": false, "AttachStderr": false, "ExposedPorts": { "6006/tcp": {}, "8888/tcp": {} }, "Tty": true, "OpenStdin": true, "StdinOnce": false, "Env": [ "PATH=/usr/local/lib/python3.10/dist-packages/torch_tensorrt/bin:/usr/local/mpi/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/ucx/bin:/opt/tensorrt/bin", "CUDA_VERSION=12.5.0.023", "CUDA_DRIVER_VERSION=555.42.02", "CUDA_CACHE_DISABLE=1", "NVIDIA_REQUIRE_JETPACK_HOST_MOUNTS=", "_CUDA_COMPAT_PATH=/usr/local/cuda/compat", "ENV=/etc/shinit_v2", "BASH_ENV=/etc/bash.bashrc", "SHELL=/bin/bash", "NVIDIA_REQUIRE_CUDA=cuda>=9.0", "NCCL_VERSION=2.21.5", "CUBLAS_VERSION=12.5.2.13", "CUFFT_VERSION=11.2.3.18", "CURAND_VERSION=10.3.6.39", "CUSPARSE_VERSION=12.4.1.24", "CUSOLVER_VERSION=11.6.2.40", "CUTENSOR_VERSION=2.0.1.2", "NPP_VERSION=12.3.0.116", "NVJPEG_VERSION=12.3.2.38", "CUDNN_VERSION=9.1.0.70+cuda12.4", "TRT_VERSION=10.1.0.27+cuda12.4.1.003", "TRTOSS_VERSION=24.06", "NSIGHT_SYSTEMS_VERSION=2024.2.3.38", "NSIGHT_COMPUTE_VERSION=2024.2.0.16", "DALI_VERSION=1.38.0", "DALI_BUILD=15028468", "POLYGRAPHY_VERSION=0.49.11", "TRANSFORMER_ENGINE_VERSION=1.7", "MODEL_OPT_VERSION=0.11.2", "LD_LIBRARY_PATH=/usr/local/lib/python3.10/dist-packages/torch/lib:/usr/local/lib/python3.10/dist-packages/torch_tensorrt/lib:/usr/local/cuda/compat/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64", "NVIDIA_VISIBLE_DEVICES=all", "NVIDIA_DRIVER_CAPABILITIES=compute,utility,video", "NVIDIA_PRODUCT_NAME=PyTorch", "GDRCOPY_VERSION=2.3.1-1", "HPCX_VERSION=2.19", "MOFED_VERSION=5.4-rdmacore39.0", "OPENUCX_VERSION=1.17.0", "OPENMPI_VERSION=4.1.7", "RDMACORE_VERSION=39.0", "OPAL_PREFIX=/opt/hpcx/ompi", "OMPI_MCA_coll_hcoll_enable=0", "LIBRARY_PATH=/usr/local/cuda/lib64/stubs:", "PYTORCH_BUILD_VERSION=2.4.0a0+f70bd71", "PYTORCH_VERSION=2.4.0a0+f70bd71", "PYTORCH_BUILD_NUMBER=0", "NVIDIA_PYTORCH_VERSION=24.06", "NVFUSER_BUILD_VERSION=f73ff1b", "NVFUSER_VERSION=f73ff1b", "PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION=python", "NVPL_LAPACK_MATH_MODE=PEDANTIC", "PYTHONIOENCODING=utf-8", "LC_ALL=C.UTF-8", "PIP_DEFAULT_TIMEOUT=100", "NVM_DIR=/usr/local/nvm", "NODE_OPTIONS=--openssl-legacy-provider", "JUPYTER_PORT=8888", "TENSORBOARD_PORT=6006", "UCC_CL_BASIC_TLS=^sharp", "TORCH_CUDA_ARCH_LIST=5.2 6.0 6.1 7.0 7.2 7.5 8.0 8.6 8.7 9.0+PTX", "PYTORCH_HOME=/opt/pytorch/pytorch", "CUDA_HOME=/usr/local/cuda", "TORCH_ALLOW_TF32_CUBLAS_OVERRIDE=1", "USE_EXPERIMENTAL_CUDNN_V8_API=1", "COCOAPI_VERSION=2.0+nv0.8.0", "TORCH_CUDNN_V8_API_ENABLED=1", "CUDA_MODULE_LOADING=LAZY", "NVIDIA_BUILD_ID=96418707", "PIP_INDEX_URL=https://pypi.tuna.tsinghua.edu.cn/simple" ], "Cmd": [ "/usr/sbin/sshd", "-D", "-p", "60023" ], "Image": "70d86cd35082", "Volumes": null, "WorkingDir": "/workspace", "Entrypoint": [ "/opt/nvidia/nvidia_entrypoint.sh" ], "OnBuild": null, "Labels": { "airs-user": "airs-user", "com.nvidia.build.id": "96418707", "com.nvidia.build.ref": "3017efeca4038be2c8c0f965cf868f48051bff16", "com.nvidia.cublas.version": "12.5.2.13", "com.nvidia.cuda.version": "9.0", "com.nvidia.cudnn.version": "9.1.0.70+cuda12.4", "com.nvidia.cufft.version": "11.2.3.18", "com.nvidia.curand.version": "10.3.6.39", "com.nvidia.cusolver.version": "11.6.2.40", "com.nvidia.cusparse.version": "12.4.1.24", "com.nvidia.cutensor.version": "2.0.1.2", "com.nvidia.nccl.version": "2.21.5", "com.nvidia.npp.version": "12.3.0.116", "com.nvidia.nsightcompute.version": "2024.2.0.16", "com.nvidia.nsightsystems.version": "2024.2.3.38", "com.nvidia.nvjpeg.version": "12.3.2.38", "com.nvidia.pytorch.version": "2.4.0a0+f70bd71", "com.nvidia.tensorrt.version": "10.1.0.27+cuda12.4.1.003", "com.nvidia.tensorrtoss.version": "24.06", "com.nvidia.volumes.needed": "nvidia_driver", "library": "library", "org.opencontainers.image.ref.name": "ubuntu", "org.opencontainers.image.version": "22.04" } }, "NetworkSettings": { "Bridge": "", "SandboxID": "b213c086b02c6f0033a3a22c17ddbb9979829c55ff42d509c4f957a7556b006b", "HairpinMode": false, "LinkLocalIPv6Address": "", "LinkLocalIPv6PrefixLen": 0, "Ports": {}, "SandboxKey": "/var/run/docker/netns/default", "SecondaryIPAddresses": null, "SecondaryIPv6Addresses": null, "EndpointID": "", "Gateway": "", "GlobalIPv6Address": "", "GlobalIPv6PrefixLen": 0, "IPAddress": "", "IPPrefixLen": 0, "IPv6Gateway": "", "MacAddress": "", "Networks": { "host": { "IPAMConfig": null, "Links": null, "Aliases": null, "NetworkID": "7708d594bfe6066cbde4ca0f4ee443bd7f69afc3c7d723b702046f8530da7cdd", "EndpointID": "6034de2abfb872f3d8b1c4f69cb2fd30bcdbbd01d5b78dfce02075c01d576818", "Gateway": "", "IPAddress": "", "IPPrefixLen": 0, "IPv6Gateway": "", "GlobalIPv6Address": "", "GlobalIPv6PrefixLen": 0, "MacAddress": "", "DriverOpts": null } } } } ]