Skip to content

x86 optimization for gemm int8 #4794

x86 optimization for gemm int8

x86 optimization for gemm int8 #4794

name: linux-riscv64-cpu-gcc
on:
push:
branches: [master]
paths:
- '.github/workflows/linux-riscv64-cpu-gcc.yml'
- 'toolchains/riscv64-linux-gnu.toolchain.cmake'
- 'toolchains/riscv64-unknown-linux-gnu.toolchain.cmake'
- 'CMakeLists.txt'
- 'cmake/**'
- 'src/*'
- 'src/layer/*'
- 'src/layer/riscv/**'
- 'tests/**'
pull_request:
branches: [master]
paths:
- '.github/workflows/linux-riscv64-cpu-gcc.yml'
- 'toolchains/riscv64-linux-gnu.toolchain.cmake'
- 'toolchains/riscv64-unknown-linux-gnu.toolchain.cmake'
- 'CMakeLists.txt'
- 'cmake/**'
- 'src/*'
- 'src/layer/*'
- 'src/layer/riscv/**'
- 'tests/**'
concurrency:
group: linux-riscv64-cpu-gcc-${{ github.ref }}
cancel-in-progress: true
permissions:
contents: read
jobs:
linux-gcc-riscv64:
runs-on: ubuntu-20.04
steps:
- uses: actions/checkout@v4
- name: cache-qemu
id: cache-qemu
uses: actions/cache@v4
with:
path: qemu-install
key: qemu-riscv64-install-20220502-4
- name: install-qemu-build-deps
if: steps.cache-qemu.outputs.cache-hit != 'true'
run: |
sudo apt-get update
sudo apt-get install autoconf automake autotools-dev ninja-build
- name: checkout-qemu
if: steps.cache-qemu.outputs.cache-hit != 'true'
uses: actions/checkout@v4
with:
repository: qemu/qemu
path: qemu
ref: f5643914a9e8f79c606a76e6a9d7ea82a3fc3e65
- name: qemu
if: steps.cache-qemu.outputs.cache-hit != 'true'
run: |
cd qemu
wget https://raw.githubusercontent.com/nihui/ncnn-assets/master/qemu-patches/0007-linux-user-Expose-risc-v-V-isa-bit-in-get_elf_hwcap.patch
patch -p1 -i 0007-linux-user-Expose-risc-v-V-isa-bit-in-get_elf_hwcap.patch
./configure --prefix=$GITHUB_WORKSPACE/qemu-install --target-list=riscv64-linux-user --disable-system
make -j$(nproc)
make install
- name: riscv64-gnu-toolchain
run: |
sudo apt-get update
sudo apt-get install g++-riscv64-linux-gnu
- name: configure
run: mkdir build && cd build && cmake -DCMAKE_TOOLCHAIN_FILE=../toolchains/riscv64-linux-gnu.toolchain.cmake -DNCNN_BUILD_TOOLS=OFF -DNCNN_BUILD_EXAMPLES=OFF -DNCNN_BUILD_TESTS=ON ..
- name: build
run: cmake --build build -j $(nproc)
- name: test
run: |
export PATH=$GITHUB_WORKSPACE/qemu-install/bin:$PATH
cd build
TESTS_EXECUTABLE_LOADER=qemu-riscv64 TESTS_EXECUTABLE_LOADER_ARGUMENTS="-L;/usr/riscv64-linux-gnu" ctest --output-on-failure -j $(nproc)
linux-gcc-riscv64-c906:
runs-on: [self-hosted, linux, centos]
steps:
- uses: actions/checkout@v4
- name: configure
run: |
export RISCV_ROOT_PATH=/data/action/osd/Xuantie-900-gcc-linux-5.10.4-glibc-x86_64-V2.6.1
mkdir build && cd build
cmake -DCMAKE_TOOLCHAIN_FILE=../toolchains/c906-v226.toolchain.cmake -DCMAKE_BUILD_TYPE=release -DNCNN_OPENMP=OFF -DNCNN_THREADS=OFF -DNCNN_RUNTIME_CPU=OFF -DNCNN_RVV=ON -DNCNN_SIMPLEOCV=ON -DNCNN_BUILD_EXAMPLES=ON -DNCNN_BUILD_TESTS=ON ..
- name: build
run: cmake --build build -j 4
- name: test
run: |
export PATH=/data/action/osd/xuantie-qemu-x86_64-Ubuntu-18.04-20230413-0706/bin:$PATH
cd build
TESTS_EXECUTABLE_LOADER=qemu-riscv64 TESTS_EXECUTABLE_LOADER_ARGUMENTS="-cpu;c906fdv" ctest --output-on-failure -j 4
linux-gcc-riscv64-rvv:
runs-on: [self-hosted, linux, centos]
steps:
- uses: actions/checkout@v4
#- name: cache-qemu
#id: cache-qemu
#uses: actions/cache@v4
#with:
#path: qemu-install
#key: qemu-riscv64-install-20220502-3
#- name: install-qemu-build-deps
#if: steps.cache-qemu.outputs.cache-hit != 'true'
#run: |
#sudo apt-get update
#sudo apt-get install autoconf automake autotools-dev ninja-build
#- name: checkout-qemu
#if: steps.cache-qemu.outputs.cache-hit != 'true'
#uses: actions/checkout@v4
#with:
#repository: qemu/qemu
#path: qemu
#ref: f5643914a9e8f79c606a76e6a9d7ea82a3fc3e65
#- name: qemu
#if: steps.cache-qemu.outputs.cache-hit != 'true'
#run: |
#cd qemu
#wget https://raw.githubusercontent.com/nihui/ncnn-assets/master/qemu-patches/0007-linux-user-Expose-risc-v-V-isa-bit-in-get_elf_hwcap.patch
#patch -p1 -i 0007-linux-user-Expose-risc-v-V-isa-bit-in-get_elf_hwcap.patch
#./configure --prefix=$GITHUB_WORKSPACE/qemu-install --target-list=riscv64-linux-user --disable-system
#make -j2
#make install
#- name: cache-riscv
#id: cache-riscv
#uses: actions/cache@v4
#with:
#path: rv64gcv-install-next
#key: rv64gcv-linux-install-20210504
#- name: install-riscv-build-deps
#if: steps.cache-riscv.outputs.cache-hit != 'true'
#run: |
#sudo apt-get update
#sudo apt-get install autoconf automake autotools-dev curl python3 libmpc-dev libmpfr-dev libgmp-dev gawk build-essential bison flex texinfo gperf libtool patchutils bc zlib1g-dev libexpat-dev device-tree-compiler
#- name: checkout-riscv-gnu-toolchain
#if: steps.cache-riscv.outputs.cache-hit != 'true'
#uses: actions/checkout@v4
#with:
#repository: riscv/riscv-gnu-toolchain
#path: riscv-gnu-toolchain
#ref: da01ba455ce3802ffa84fdca3a089079996dbfc3
#- name: checkout-riscv-gnu-toolchain-submodules
#if: steps.cache-riscv.outputs.cache-hit != 'true'
#run: |
#cd riscv-gnu-toolchain
#git submodule update --init --recursive --depth 1 glibc
#git submodule update --init --recursive --depth 1 newlib
#git submodule update --init --recursive --depth 1 riscv-binutils
#git submodule update --init --recursive --depth 1 riscv-gcc
#git submodule update --init --recursive --depth 1 riscv-dejagnu
#git submodule update --init --recursive --depth 1 riscv-gdb
#- name: riscv-gnu-toolchain
#if: steps.cache-riscv.outputs.cache-hit != 'true'
#run: |
#cd riscv-gnu-toolchain
#sed -i '/__OBSOLETE_MATH/d' newlib/newlib/libm/common/math_errf.c
#./configure --prefix=$GITHUB_WORKSPACE/rv64gcv-install-next --with-arch=rv64gcv_zfh
#make linux
#- name: riscv-strip-install
#if: steps.cache-riscv.outputs.cache-hit != 'true'
#run: find $GITHUB_WORKSPACE/rv64gcv-install-next -type f | xargs -i strip -g {} || true
- name: configure
run: export RISCV_ROOT_PATH=/data/action/osd/rv64gcv-install-next && mkdir build && cd build && cmake -DCMAKE_TOOLCHAIN_FILE=../toolchains/riscv64-unknown-linux-gnu.toolchain.cmake -DNCNN_BUILD_TOOLS=OFF -DNCNN_BUILD_EXAMPLES=OFF -DNCNN_BUILD_TESTS=ON ..
- name: build
run: cmake --build build -j 4
- name: test-vlen256
run: |
export PATH=/data/action/osd/qemu-install/bin:$PATH
cd build
TESTS_EXECUTABLE_LOADER=qemu-riscv64 TESTS_EXECUTABLE_LOADER_ARGUMENTS="-cpu;rv64,v=true,Zfh=true,vlen=256,elen=64,vext_spec=v1.0;-L;/data/action/osd/rv64gcv-install-next/sysroot" ctest --output-on-failure -j 4
- name: test-vlen128
run: |
export PATH=/data/action/osd/qemu-install/bin:$PATH
cd build
TESTS_EXECUTABLE_LOADER=qemu-riscv64 TESTS_EXECUTABLE_LOADER_ARGUMENTS="-cpu;rv64,v=true,Zfh=true,vlen=128,elen=64,vext_spec=v1.0;-L;/data/action/osd/rv64gcv-install-next/sysroot" ctest --output-on-failure -j 4