Commit ec5e8d89 authored by chenpangpang

Merge branch 'paddle' into 'dev'

Paddle

See merge request !5
parents 1440eb08 338ca45c
......@@ -52,13 +52,31 @@
- Parameter 3: base image
- TENSORFLOW_VERSION: TensorFlow version
- CONDA_URL: URL of the conda installer
- paddlepaddle
```bash
cd build_space && \
./build_ubuntu.sh jupyterlab \
jupyterlab-paddle:2.6-py3.11-cuda12.0-ubuntu22.04-devel \
nvidia/cuda:12.0.0-cudnn8-devel-ubuntu22.04 \
PADDLEPADDLE_VERSION="2.6.0.post120" \
PADDLENLP_VERSION="2.7.2" \
CONDA_URL="https://mirrors.tuna.tsinghua.edu.cn/anaconda/miniconda/Miniconda3-py311_24.7.1-0-Linux-x86_64.sh" \
PADDLE_URL="https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
```
- Parameter 1: ide; no change needed
- Parameter 2: output image name
- Parameter 3: base image
- PADDLEPADDLE_VERSION: PaddlePaddle version
- PADDLENLP_VERSION: PaddleNLP version
- CONDA_URL: URL of the conda installer
- PADDLE_URL: PaddlePaddle install source; leave it empty to download from the default source (the Tsinghua mirror), as shown in the sketch after this list
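For comparison, here is a sketch of a build that leaves PADDLE_URL empty so PaddlePaddle is pulled from the default (Tsinghua) source. The output image name and base image below are illustrative, the version pair follows the 2.6 / cuda11.8 entry in attach/paddle.json, and it is assumed that build_ubuntu.sh accepts an empty PADDLE_URL:
```bash
cd build_space && \
./build_ubuntu.sh jupyterlab \
jupyterlab-paddle:2.6-py3.11-cuda11.8-ubuntu22.04-devel \
nvidia/cuda:11.8.0-cudnn8-devel-ubuntu22.04 \
PADDLEPADDLE_VERSION="2.6.0" \
PADDLENLP_VERSION="2.8.1" \
CONDA_URL="https://mirrors.tuna.tsinghua.edu.cn/anaconda/miniconda/Miniconda3-py311_24.7.1-0-Linux-x86_64.sh" \
PADDLE_URL=""
```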
### Related links
- PyTorch images (**choose a devel image**): https://hub.docker.com/r/pytorch/pytorch/tags
- NVIDIA images (**choose a devel image**): https://hub.docker.com/r/nvidia/cuda/tags
- torch / torchvision / torchaudio / CUDA version matrix: https://pytorch.org/get-started/previous-versions/
- conda installers: https://mirrors.tuna.tsinghua.edu.cn/anaconda/miniconda/
- PaddlePaddle dependency reference: attach/paddle.json (see the lookup sketch after this list)
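To check which PaddlePaddle / PaddleNLP / install-source combination the automation will pick for a given framework and CUDA version, you can query attach/paddle.json directly. A minimal lookup sketch, assuming jq is available on the build host:
```bash
# Print the entry used for framework version 2.6 on cuda12.0
jq '.[] | select(.paddle_excel_version == "2.6" and .cuda_version == "cuda12.0")' attach/paddle.json
```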
## Image verification
1. Version check: run `sh script/1_base_test.sh $IMAGE_NAME`; the output should be:
```
......@@ -131,4 +149,4 @@ The output image has been saved as output.png
- Get the base image name and output image name from the plan sheet and the image tag sheet
- Feishu bot: automatically report image build status
- Feishu bot: reminders for images awaiting push
- CI/CD pipeline
[
{
"paddle_excel_version": "3.0-beta",
"cuda_version": "cuda12.3",
"paddle_version": "3.0.0b2",
"paddlenlp_version": "3.0.0b0",
"paddle_url": "https://www.paddlepaddle.org.cn/packages/stable/cu123/"
},
{
"paddle_excel_version": "3.0-beta",
"cuda_version": "cuda11.8",
"paddle_version": "3.0.0b2",
"paddlenlp_version": "3.0.0b0",
"paddle_url": "https://www.paddlepaddle.org.cn/packages/stable/cu118/"
},
{
"paddle_excel_version": "2.6",
"cuda_version": "cuda12.0",
"paddle_version": "2.6.0.post120",
"paddlenlp_version": "2.7.2",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.6",
"cuda_version": "cuda11.8",
"paddle_version": "2.6.0",
"paddlenlp_version": "2.8.1",
"paddle_url": null
},
{
"paddle_excel_version": "2.5",
"cuda_version": "cuda12.0",
"paddle_version": "2.5.2.post120",
"paddlenlp_version": "2.5.1",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.5",
"cuda_version": "cuda11.7",
"paddle_version": "2.5.2.post117",
"paddlenlp_version": "2.5.1",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.4",
"cuda_version": "cuda11.7",
"paddle_version": "2.4.2.post117",
"paddlenlp_version": "2.4.1",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.4",
"cuda_version": "cuda11.6",
"paddle_version": "2.4.2.post116",
"paddlenlp_version": "2.5.1",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.3",
"cuda_version": "cuda11.6",
"paddle_version": "2.3.2.post116",
"paddlenlp_version": "2.5.1",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.3",
"cuda_version": "cuda11.2",
"paddle_version": "2.3.2.post112",
"paddlenlp_version": "2.4.1",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.2",
"cuda_version": "cuda11.2",
"paddle_version": "2.2.2.post112",
"paddlenlp_version": "2.2.0",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.2",
"cuda_version": "cuda11.1",
"paddle_version": "2.2.2.post110",
"paddlenlp_version": "2.2.0",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.1",
"cuda_version": "cuda11.2",
"paddle_version": "2.1.3.post112",
"paddlenlp_version": "2.1.1",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.1",
"cuda_version": "cuda11.0",
"paddle_version": "2.1.3.post110",
"paddlenlp_version": "2.1.1",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "2.0",
"cuda_version": "cuda10.1",
"paddle_version": "2.0.2.post101",
"paddlenlp_version": "2.0.0",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/mkl/stable.html"
},
{
"paddle_excel_version": "2.0",
"cuda_version": "cuda10.0",
"paddle_version": "2.0.2.post100",
"paddlenlp_version": "2.0.0",
"paddle_url": "https://www.paddlepaddle.org.cn/whl/mkl/stable.html"
},
{
"paddle_excel_version": "1.8",
"cuda_version": "cuda10.1",
"paddle_version": "1.8.5.post107",
"paddlenlp_version": null,
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
},
{
"paddle_excel_version": "1.8",
"cuda_version": "cuda10.0",
"paddle_version": "1.8.5.post107",
"paddlenlp_version": null,
"paddle_url": "https://www.paddlepaddle.org.cn/whl/linux/mkl/avx/stable.html"
}
]
......@@ -7,7 +7,8 @@ import time
from concurrent.futures import ThreadPoolExecutor, wait, ALL_COMPLETED
import argparse
import logging
import json
from packaging.version import Version
class MyLogger:
def __init__(self, logger_name, log_file, console_handler=True, level=logging.INFO):
......@@ -92,12 +93,29 @@ def package_and_transfer(image_name, tar_file, image_result_dir, logger):
logger.info(f"==== Image {image_name} transfer complete ====")
# Look up the paddle install info in the JSON file
def get_paddle_info(paddlepaddle_version, cuda_version):
# Load the JSON data
with open("attach/paddle.json", "r", encoding="utf-8") as file:
version_data = json.load(file)
for item in version_data:
if item["paddle_excel_version"] == paddlepaddle_version and item["cuda_version"] == cuda_version:
return {
"paddle_version": item["paddle_version"],
"paddlenlp_version": item["paddlenlp_version"],
"paddle_url": item["paddle_url"]
}
return None
def run():
# Read the Excel file
df = pd.read_excel(args.input_file)
os.makedirs(args.log_dir, exist_ok=True)
# Paddle-related build parameters; resolved per row for paddle images
paddle_version = None
paddlenlp_version = None
paddle_url = None
# Create a thread pool
with ThreadPoolExecutor() as executor:
# Iterate over every row and build each image automatically
......@@ -107,6 +125,7 @@ def run():
framework_version = row['框架版本'] # take the framework version directly as framework_VERSION
other_dependencies = row['其他依赖包']
conda_url = row['conda url'] # get the conda URL
cuda_version = row['Runtime版本'].strip().lower() # get the CUDA version
# Log file
if os.path.exists(os.path.join(args.log_dir, image_name)):
......@@ -137,6 +156,17 @@ def run():
if torchaudio_version is None:
torchaudio_version = "version not found"
# Handle the more involved download sources and dependency constraints
if isinstance(base_image, str):
if "paddle" in image_name:
paddle_info = get_paddle_info(str(framework_version), str(cuda_version))
if paddle_info:
paddle_version = paddle_info["paddle_version"]
paddlenlp_version = paddle_info["paddlenlp_version"]
paddle_url = paddle_info["paddle_url"]
else:
print("No matching PaddlePaddle / CUDA version combination was found")
# Build logic based on PyTorch or NVIDIA base images
if isinstance(base_image, str):
if "pytorch" in image_name:
......@@ -166,6 +196,17 @@ def run():
CONDA_URL="{conda_url}" \
2>&1 | tee ../{args.log_dir}/{image_name}/build.log
"""
elif "paddle" in image_name:
build_command = f"""
cd build_space && \
./build_ubuntu.sh jupyterlab {image_name} {base_image} \
PADDLEPADDLE_VERSION="{paddle_version}" \
PADDLENLP_VERSION="{paddlenlp_version}" \
CONDA_URL="{conda_url}" \
PADDLE_URL="{paddle_url}" \
2>&1 | tee ../{args.log_dir}/{image_name}/build.log
"""
# Print the build command (for debugging)
logger.info(build_command)
......@@ -190,6 +231,11 @@ def run():
if "pytorch" in image_name:
test_commands.append(
f"mv gpu-base-image-test/pytorch/stable-diffusion-v1-4/output.png {image_result_dir}")
elif "paddle" in image_name:
# Compare versions using packaging.version.Version
if Version(paddle_version) >= Version("2.4"):
test_commands.append(
f"mv gpu-base-image-test/paddle/output.png {image_result_dir}")
# Run the test commands
for test_command in test_commands:
......
......@@ -104,8 +104,15 @@ RUN if [ $TENSORFLOW_VERSION == "2.16.1" ]; then \
# ----- paddlepaddle install -----
RUN if [ -n "$PADDLEPADDLE_VERSION" ] && [ -n "$PADDLE_URL" ]; then \
pip install paddlepaddle-gpu==$PADDLEPADDLE_VERSION -f $PADDLE_URL -i $PADDLE_URL \
&& rm -r /root/.cache/pip; \
if [ "$(echo -e "$PADDLEPADDLE_VERSION\n3.0" | sort -V | head -n1)" = "3.0" ]; then \
# 处理 PADDLEPADDLE_VERSION >= 3.0 的情况
pip install paddlepaddle-gpu==$PADDLEPADDLE_VERSION -f $PADDLE_URL -i $PADDLE_URL && \
rm -r /root/.cache/pip; \
else \
# 处理 PADDLEPADDLE_VERSION < 3.0 的情况
pip install paddlepaddle-gpu==$PADDLEPADDLE_VERSION -f $PADDLE_URL && \
rm -r /root/.cache/pip; \
fi; \
fi
RUN if [ -n "$PADDLEPADDLE_VERSION" ] && [ -z "$PADDLE_URL" ]; then \
......@@ -114,10 +121,21 @@ RUN if [ -n "$PADDLEPADDLE_VERSION" ] && [ -z "$PADDLE_URL" ]; then \
fi
RUN if [ -n "$PADDLENLP_VERSION" ] ; then \
pip install paddlenlp==$PADDLENLP_VERSION ppdiffusers huggingface_hub --no-cache-dir -i https://pypi.tuna.tsinghua.edu.cn/simple && \
pip install --upgrade ppdiffusers --no-deps && rm -r /root/.cache/pip; \
if [ -n "$PADDLEPADDLE_VERSION" ] && \
[ "$(echo -e "$PADDLEPADDLE_VERSION\n2.3" | sort -V | head -n1)" = "2.3" ]; then \
# 处理 PADDLEPADDLE_VERSION >= 2.3 的情况
pip install paddlenlp==$PADDLENLP_VERSION ppdiffusers huggingface_hub==0.25.0 --no-cache-dir -i https://pypi.tuna.tsinghua.edu.cn/simple && \
rm -r /root/.cache/pip; \
else \
# 处理 PADDLEPADDLE_VERSION < 2.3 的情况
pip install paddlenlp==$PADDLENLP_VERSION numpy==1.19.5 protobuf==3.20.3 --no-cache-dir -i https://pypi.tuna.tsinghua.edu.cn/simple && \
# 替换小于2.3版本中np.object为object
sed -i 's/np\.object/object/g' /opt/conda/lib/python3.*/site-packages/paddle/**/*.py && \
rm -r /root/.cache/pip; \
fi; \
fi
COPY ./python-requirements.txt /tmp/
RUN pip install --no-cache-dir -r /tmp/python-requirements.txt
......
......@@ -56,9 +56,9 @@ cp -a $WORKSPACE/static/index.html ${jupyter_file_path}/static/index.html
cp -a $WORKSPACE/static/scnet-loading.gif ${jupyter_file_path}/static/scnet-loading.gif
pip3 uninstall -r $WORKSPACE/requirements.txt
pip3 uninstall -r $WORKSPACE/requirements.txt -y
pip3 install --no-index --find-links=$WORKSPACE/ -r $WORKSPACE/requirements.txt
if pip list | grep -E 'jupyter_ext_platform' && pip list | grep -E 'jupyter_ext_model' && pip list | grep -E 'jupyterlab-language-pack-zh-CN' && [ "$(jupyter lab --version | cut -d. -f1)" -gt 2 ]; then echo "install succeeded"; else echo "install failed!!" | tee /jupyter-ext/errorImages.txt; fi
......
......@@ -51,7 +51,7 @@ elif [[ "$1" == *"tensorflow"* ]]; then
os.system('nvcc -V | tail -n 2')
"; fi
elif [[ "$1" == *"paddle"* ]]; then
TARGET_DIR=gpu-base-image-test/paddletest
TARGET_DIR=gpu-base-image-test/paddle
docker run --rm --platform=linux/amd64 --gpus all -v ./$TARGET_DIR:/workspace --workdir /workspace $1 python base_test.py
else
......
......@@ -21,7 +21,7 @@ if [[ "$1" == *"tensorflow"* ]]; then
else
docker run --rm --platform=linux/amd64 --gpus all -v ./$TARGET_DIR:/workspace --workdir /workspace/tensorflow/bert $1 python infer.py; fi; fi
if [[ "$1" == *"paddle"* ]]; then
TARGET_DIR=gpu-base-image-test/paddletest
TARGET_DIR=gpu-base-image-test/paddle
docker run --rm --platform=linux/amd64 --gpus all -v ./$TARGET_DIR:/workspace --workdir /workspace $1 python text.py; fi
......@@ -22,7 +22,7 @@ if [[ "$1" == *"tensorflow"* ]]; then
docker run --rm --platform=linux/amd64 --gpus all -v ./$TARGET_DIR:/workspace --workdir /workspace/tensorflow/mnist $1 python train.py; fi; fi
if [[ "$1" == *"paddle"* ]]; then
TARGET_DIR=gpu-base-image-test/paddletest
TARGET_DIR=gpu-base-image-test/paddle
docker run --rm --platform=linux/amd64 --gpus all -v ./$TARGET_DIR:/workspace --workdir /workspace $1 python image.py; fi