Skip to content

Commit 1a34f7a

Browse files
authored
Merge branch 'PaddlePaddle:develop' into develop
2 parents 78a0952 + 31c219d commit 1a34f7a

129 files changed

Lines changed: 18289 additions & 701 deletions

File tree

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

.github/workflows/_gpu_4cards_case_test.yml

Lines changed: 1 addition & 20 deletions
Original file line numberDiff line numberDiff line change
@@ -190,24 +190,5 @@ jobs:
190190
export PYTHONPATH=/workspace/FastDeploy/
191191
192192
export CUDA_VISIBLE_DEVICES=0,1,2,3
193-
echo "============================================================"
194-
echo "Running pytest for 4-GPU end-to-end cases"
195-
196-
python -m pytest -sv --tb=short tests/e2e/4cards_cases/
197-
exit_code=$?
198-
199-
if [ $exit_code -ne 0 ]; then
200-
if [ -f "./log/log_0/workerlog.0" ]; then
201-
echo "---------------- log/workerlog.0 -------------------"
202-
cat "./log/log_0/workerlog.0"
203-
echo "----------------------------------------------------"
204-
fi
205-
206-
if [ -f "./server.log" ]; then
207-
echo "---------------- server.log ----------------"
208-
cat "./server.log"
209-
echo "--------------------------------------------"
210-
fi
211-
exit 1
212-
fi
193+
bash scripts/run_gpu_4cards.sh
213194
'

.github/workflows/ce_job.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -162,7 +162,7 @@ jobs:
162162
if: ${{ needs.ce_job_pre_check.outputs.sm8090_match == 'true' }}
163163
uses: ./.github/workflows/_build_linux_rl.yml
164164
with:
165-
DOCKER_IMAGE: iregistry.baidu-int.com/tiangexiao/base-images:paddlecloud-ubuntu24.04-gcc13.3-cuda12.9-cudnn9.9-bccl1.4.1.4-nccl2.26.5-openmpi4.1.5-FleetY13.0.0-rc2
165+
DOCKER_IMAGE: iregistry.baidu-int.com/new_rl_infra/base-images:paddlecloud-ubuntu24.04-gcc13.3-cuda12.9-cudnn9.9-bccl1.4.1.4-nccl2.26.5-openmpi4.1.5-FleetY13.0.0-v2.4.0-rc1
166166
FASTDEPLOY_ARCHIVE_URL: ${{ needs.clone.outputs.repo_archive_url }}
167167
COMPILE_ARCH: "80,90"
168168
WITH_NIGHTLY_BUILD: OFF

custom_ops/gpu_ops/swap_cache_layout.cu

Lines changed: 10 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -73,6 +73,11 @@ void SwapCacheImpLayout(
7373
copy_kind,
7474
stream);
7575

76+
PADDLE_ENFORCE_EQ(status,
77+
cudaSuccess,
78+
phi::errors::External("cudaMemcpyAsync failed: %s",
79+
cudaGetErrorString(status)));
80+
7681
#ifdef SWAP_DEBUG
7782
cudaStreamSynchronize(stream);
7883
std::cout << "mode:" << mode << ", layer_idx:" << layer_idx
@@ -81,7 +86,11 @@ void SwapCacheImpLayout(
8186
#endif
8287
}
8388
}
84-
cudaStreamSynchronize(stream);
89+
cudaError_t sync_status = cudaStreamSynchronize(stream);
90+
PADDLE_ENFORCE_EQ(sync_status,
91+
cudaSuccess,
92+
phi::errors::External("cudaStreamSynchronize failed: %s",
93+
cudaGetErrorString(sync_status)));
8594
}
8695

8796
void SwapCacheLayout(

dockerfiles/Dockerfile.gpu

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
FROM ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlepaddle/fastdeploy-cuda-12.6:tag-base
2-
ARG PADDLE_VERSION=3.2.1
3-
ARG FD_VERSION=2.3.0
2+
ARG PADDLE_VERSION=3.3.0
3+
ARG FD_VERSION=2.4.0
44

55
ENV DEBIAN_FRONTEND=noninteractive
66

docs/get_started/installation/nvidia_gpu.md

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@ docker pull ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlepaddle/fastdeploy-cuda-12
2323
First install paddlepaddle-gpu. For detailed instructions, refer to [PaddlePaddle Installation](https://www.paddlepaddle.org.cn/en/install/quick?docurl=/documentation/docs/en/develop/install/pip/linux-pip_en.html)
2424
```shell
2525
# Install stable release
26-
python -m pip install paddlepaddle-gpu==3.2.1 -i https://www.paddlepaddle.org.cn/packages/stable/cu126/
26+
python -m pip install paddlepaddle-gpu==3.3.0 -i https://www.paddlepaddle.org.cn/packages/stable/cu126/
2727

2828
# Install latest Nightly build
2929
python -m pip install --pre paddlepaddle-gpu -i https://www.paddlepaddle.org.cn/packages/nightly/cu126/
@@ -34,7 +34,7 @@ Then install fastdeploy. **Do not install from PyPI**. Use the following methods
3434
For SM80/90 architecture GPUs(e.g A30/A100/H100/):
3535
```
3636
# Install stable release
37-
python -m pip install fastdeploy-gpu==2.3.3 -i https://www.paddlepaddle.org.cn/packages/stable/fastdeploy-gpu-80_90/ --extra-index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple
37+
python -m pip install fastdeploy-gpu==2.4.0 -i https://www.paddlepaddle.org.cn/packages/stable/fastdeploy-gpu-80_90/ --extra-index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple
3838
3939
# Install latest Nightly build
4040
python -m pip install fastdeploy-gpu -i https://www.paddlepaddle.org.cn/packages/nightly/fastdeploy-gpu-80_90/ --extra-index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple
@@ -43,7 +43,7 @@ python -m pip install fastdeploy-gpu -i https://www.paddlepaddle.org.cn/packages
4343
For SM86/89 architecture GPUs(e.g A10/4090/L20/L40):
4444
```
4545
# Install stable release
46-
python -m pip install fastdeploy-gpu==2.3.3 -i https://www.paddlepaddle.org.cn/packages/stable/fastdeploy-gpu-86_89/ --extra-index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple
46+
python -m pip install fastdeploy-gpu==2.4.0 -i https://www.paddlepaddle.org.cn/packages/stable/fastdeploy-gpu-86_89/ --extra-index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple
4747
4848
# Install latest Nightly build
4949
python -m pip install fastdeploy-gpu -i https://www.paddlepaddle.org.cn/packages/nightly/fastdeploy-gpu-86_89/ --extra-index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple
@@ -64,7 +64,7 @@ docker build -f dockerfiles/Dockerfile.gpu -t fastdeploy:gpu .
6464

6565
First install paddlepaddle-gpu. For detailed instructions, refer to [PaddlePaddle Installation](https://www.paddlepaddle.org.cn/en/install/quick?docurl=/documentation/docs/en/develop/install/pip/linux-pip_en.html)
6666
```shell
67-
python -m pip install paddlepaddle-gpu==3.2.1 -i https://www.paddlepaddle.org.cn/packages/stable/cu126/
67+
python -m pip install paddlepaddle-gpu==3.3.0 -i https://www.paddlepaddle.org.cn/packages/stable/cu126/
6868
```
6969

7070
Then clone the source code and build:
@@ -92,7 +92,7 @@ First, install paddlepaddle-gpu.
9292
For detailed instructions, please refer to the [PaddlePaddle Installation Guide](https://www.paddlepaddle.org.cn/).
9393

9494
```shell
95-
python -m pip install paddlepaddle-gpu==3.2.0 -i https://www.paddlepaddle.org.cn/packages/stable/cu126/
95+
python -m pip install paddlepaddle-gpu==3.3.0 -i https://www.paddlepaddle.org.cn/packages/stable/cu126/
9696
```
9797

9898
Then, clone the FastDeploy repository and build using the precompiled operator wheels:

0 commit comments

Comments
 (0)