# Skip to content

# Update fastapi_server_vlm.py #3

# Update fastapi_server_vlm.py

# Update fastapi_server_vlm.py #3

# Builds the linux/arm64 image described by
# docker/RK3588/VLM/Qwen2-VL.dockerfile once per matrix entry and pushes each
# result to the registry in env.REGISTRY, tagged "<alias>-latest".
name: Build and Push Qwen2-VL-RK3588 Series

on:
  # Runs on pushes to main/master that touch any of the listed paths.
  push:
    branches: [main, master]
    paths:
      - 'src/vlm/**'
      - 'docker/RK3588/VLM/Qwen2-VL.dockerfile'
      - '.github/workflows/RK3588-Qwen2-VL.yml'
      - 'lib/**'
  # Also allows the workflow to be started manually.
  workflow_dispatch:

env:
  REGISTRY: ghcr.io
  IMAGE_BASE_NAME: ${{ github.repository_owner }}/RK3588-Qwen2-VL

jobs:
  build-and-push:
    runs-on: ubuntu-latest
    permissions:
      contents: read
      # Needed so GITHUB_TOKEN can push the image to the package registry.
      packages: write
    strategy:
      # One failing model variant must not cancel the other.
      fail-fast: false
      matrix:
        # Each entry supplies the tag alias plus the file name / download URL
        # pairs that are forwarded to the Dockerfile as build arguments.
        include:
          - alias: "7b-w8a8"
            vision_file: "Qwen2_VL_7B_VISION_RK3588.rknn"
            # NOTE(review): this URL uses the "Qwen2_VL_" (underscore) prefix
            # while the other three URLs use "Qwen2-VL-"; confirm the remote
            # file name.
            vision_url: "https://huggingface.co/JiahaoLi/Qwen2-VL-RK3588/resolve/main/Qwen2_VL_7B_VISION_RK3588.rknn"
            llm_file: "Qwen2_VL_7B_LLM_RK3588.rkllm"
            llm_url: "https://huggingface.co/JiahaoLi/Qwen2-VL-RK3588/resolve/main/Qwen2-VL-7B_LLM_W8A8_RK3588.rkllm"
          - alias: "2b-w8a8"
            vision_file: "Qwen2_VL_2B_VISION_RK3588.rknn"
            vision_url: "https://huggingface.co/JiahaoLi/Qwen2-VL-RK3588/resolve/main/Qwen2-VL-2B_VISION_RK3588.rknn"
            llm_file: "Qwen2_VL_2B_LLM_RK3588.rkllm"
            llm_url: "https://huggingface.co/JiahaoLi/Qwen2-VL-RK3588/resolve/main/Qwen2-VL-2B_LLM_W8A8_RK3588.rkllm"
    steps:
      - name: Checkout repository
        uses: actions/checkout@v4
        with:
          lfs: true

      # Explicit LFS pull in addition to `lfs: true` on the checkout step.
      - name: Force LFS Pull
        run: |
          git lfs install
          git lfs pull

      # NOTE(review): this action is referenced by the mutable `main` branch;
      # consider pinning it to a release tag or commit SHA.
      - name: Free Disk Space
        uses: jlumbroso/free-disk-space@main
        with:
          tool-cache: true
          android: true
          dotnet: true
          large-packages: true
          docker-images: true

      # The runner is ubuntu-latest while the image targets linux/arm64, so
      # arm64 emulation is registered before building.
      - name: Set up QEMU
        uses: docker/setup-qemu-action@v3
        with:
          platforms: arm64

      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@v3

      - name: Log in to GHCR
        uses: docker/login-action@v3
        with:
          registry: ${{ env.REGISTRY }}
          username: ${{ github.actor }}
          password: ${{ secrets.GITHUB_TOKEN }}

      # Produces the tag/label sets consumed by the build step below.
      - name: Extract metadata
        id: meta
        uses: docker/metadata-action@v5
        with:
          images: ${{ env.REGISTRY }}/${{ env.IMAGE_BASE_NAME }}
          tags: |
            type=raw,value=${{ matrix.alias }}-latest

      - name: Build and push
        uses: docker/build-push-action@v5
        with:
          context: .
          file: ./docker/RK3588/VLM/Qwen2-VL.dockerfile
          # Important: do not set `target`, so that all instructions are
          # executed.
          push: true
          platforms: linux/arm64
          provenance: false
          build-args: |
            LLM_URL=${{ matrix.llm_url }}
            LLM_FILE=${{ matrix.llm_file }}
            VISION_URL=${{ matrix.vision_url }}
            VISION_FILE=${{ matrix.vision_file }}
          tags: ${{ steps.meta.outputs.tags }}
          labels: ${{ steps.meta.outputs.labels }}
          # A separate cache scope per matrix alias keeps the two model
          # variants from overwriting each other's GitHub Actions cache.
          cache-from: type=gha,scope=${{ matrix.alias }}
          cache-to: type=gha,mode=max,scope=${{ matrix.alias }}