squash a long, messy history of mostly merges

Signed-off-by: Dave Lee <[email protected]>
mudler · May 23, 2024 · b43ca24 · b43ca24
1 parent 8c542fc
commit b43ca24
Show file tree

Hide file tree

Showing 295 changed files with 26,709 additions and 2,782 deletions.
diff --git a/.dockerignore b/.dockerignore
@@ -6,6 +6,11 @@ examples/chatbot-ui/models
 examples/rwkv/models
 examples/**/models
 Dockerfile*
+__pycache__
 
 # SonarQube
-.scannerwork
+.scannerwork
+
+# backend virtual environments
+**/venv
+backend/python/**/source
diff --git a/.env b/.env
@@ -71,6 +71,11 @@
 ### Define the number of parallel LLAMA.cpp workers (Defaults to 1)
 # LLAMACPP_PARALLEL=1
 
+### Define a list of GRPC Servers for llama-cpp workers to distribute the load
+# https://github.com/ggerganov/llama.cpp/pull/6829
+# https://github.com/ggerganov/llama.cpp/blob/master/examples/rpc/README.md
+# LLAMACPP_GRPC_SERVERS=""
+
 ### Enable to run parallel requests
 # LOCALAI_PARALLEL_REQUESTS=true
 

diff --git a/.github/checksum_checker.sh b/.github/checksum_checker.sh
@@ -0,0 +1,126 @@
+#!/bin/bash
+# This scripts needs yq and huggingface_hub to be installed
+# to install hugingface_hub run pip install huggingface_hub
+
+# Path to the input YAML file
+input_yaml=$1
+
+# Function to download file and check checksum using Python
+function check_and_update_checksum() {
+ model_name="$1"
+ file_name="$2"
+ uri="$3"
+ old_checksum="$4"
+ idx="$5"
+
+ # Download the file and calculate new checksum using Python
+ new_checksum=$(python3 -c "
+import hashlib
+from huggingface_hub import hf_hub_download, get_paths_info
+import requests
+import sys
+import os
+
+uri = '$uri'
+file_name = uri.split('/')[-1]
+
+# Function to parse the URI and determine download method
+# Function to parse the URI and determine download method
+def parse_uri(uri):
+ if uri.startswith('huggingface://'):
+ repo_id = uri.split('://')[1]
+ return 'huggingface', repo_id.rsplit('/', 1)[0]
+ elif 'huggingface.co' in uri:
+ parts = uri.split('/resolve/')
+ if len(parts) > 1:
+ repo_path = parts[0].split('https://huggingface.co/')[-1]
+ return 'huggingface', repo_path
+ return 'direct', uri
+
+def calculate_sha256(file_path):
+ sha256_hash = hashlib.sha256()
+ with open(file_path, 'rb') as f:
+ for byte_block in iter(lambda: f.read(4096), b''):
+ sha256_hash.update(byte_block)
+ return sha256_hash.hexdigest()
+
+download_type, repo_id_or_url = parse_uri(uri)
+
+new_checksum = None
+
+# Decide download method based on URI type
+if download_type == 'huggingface':
+ # Use HF API to pull sha
+ for file in get_paths_info(repo_id_or_url, [file_name], repo_type='model'):
+ try:
+ new_checksum = file.lfs.sha256
+ break
+ except Exception as e:
+ print(f'Error from Hugging Face Hub: {str(e)}', file=sys.stderr)
+ sys.exit(2)
+ if new_checksum is None:
+ try:
+ file_path = hf_hub_download(repo_id=repo_id_or_url, filename=file_name)
+ except Exception as e:
+ print(f'Error from Hugging Face Hub: {str(e)}', file=sys.stderr)
+ sys.exit(2)
+else:
+ response = requests.get(repo_id_or_url)
+ if response.status_code == 200:
+ with open(file_name, 'wb') as f:
+ f.write(response.content)
+ file_path = file_name
+ elif response.status_code == 404:
+ print(f'File not found: {response.status_code}', file=sys.stderr)
+ sys.exit(2)
+ else:
+ print(f'Error downloading file: {response.status_code}', file=sys.stderr)
+ sys.exit(1)
+
+if new_checksum is None:
+ new_checksum = calculate_sha256(file_path)
+ print(new_checksum)
+ os.remove(file_path)
+else:
+ print(new_checksum)
+
+")
+
+ if [[ "$new_checksum" == "" ]]; then
+ echo "Error calculating checksum for $file_name. Skipping..."
+ return
+ fi
+
+ echo "Checksum for $file_name: $new_checksum"
+
+ # Compare and update the YAML file if checksums do not match
+ result=$?
+ if [[ $result -eq 2 ]]; then
+ echo "File not found, deleting entry for $file_name..."
+ # yq eval -i "del(.[$idx].files[] | select(.filename == \"$file_name\"))" "$input_yaml"
+ elif [[ "$old_checksum" != "$new_checksum" ]]; then
+ echo "Checksum mismatch for $file_name. Updating..."
+ yq eval -i "del(.[$idx].files[] | select(.filename == \"$file_name\").sha256)" "$input_yaml"
+ yq eval -i "(.[$idx].files[] | select(.filename == \"$file_name\")).sha256 = \"$new_checksum\"" "$input_yaml"
+ elif [[ $result -ne 0 ]]; then
+ echo "Error downloading file $file_name. Skipping..."
+ else
+ echo "Checksum match for $file_name. No update needed."
+ fi
+}
+
+# Read the YAML and process each file
+len=$(yq eval '. | length' "$input_yaml")
+for ((i=0; i<$len; i++))
+do
+ name=$(yq eval ".[$i].name" "$input_yaml")
+ files_len=$(yq eval ".[$i].files | length" "$input_yaml")
+ for ((j=0; j<$files_len; j++))
+ do
+ filename=$(yq eval ".[$i].files[$j].filename" "$input_yaml")
+ uri=$(yq eval ".[$i].files[$j].uri" "$input_yaml")
+ checksum=$(yq eval ".[$i].files[$j].sha256" "$input_yaml")
+ echo "Checking model $name, file $filename. URI = $uri, Checksum = $checksum"
+ check_and_update_checksum "$name" "$filename" "$uri" "$checksum" "$i"
+ done
+done
diff --git a/.github/workflows/checksum_checker.yaml b/.github/workflows/checksum_checker.yaml
@@ -0,0 +1,47 @@
+name: Check if checksums are up-to-date
+on:
+ schedule:
+ - cron: 0 20 * * *
+ workflow_dispatch:
+jobs:
+ checksum_check:
+ runs-on: arc-runner-set
+ steps:
+ - name: Force Install GIT latest
+ run: |
+ sudo apt-get update \
+ && sudo apt-get install -y software-properties-common \
+ && sudo apt-get update \
+ && sudo add-apt-repository -y ppa:git-core/ppa \
+ && sudo apt-get update \
+ && sudo apt-get install -y git
+ - uses: actions/checkout@v4
+ - name: Install dependencies
+ run: |
+ sudo apt-get update
+ sudo apt-get install -y pip wget
+ sudo pip install --upgrade pip 
+ pip install huggingface_hub
+ - name: 'Setup yq'
+ uses: dcarbone/[email protected]
+ with:
+ version: 'v4.43.1'
+ download-compressed: true
+ force: true
+
+ - name: Checksum checker 🔧
+ run: |
+ export HF_HOME=/hf_cache
+ sudo mkdir /hf_cache
+ sudo chmod 777 /hf_cache
+ bash .github/checksum_checker.sh gallery/index.yaml
+ - name: Create Pull Request
+ uses: peter-evans/create-pull-request@v6
+ with:
+ token: ${{ secrets.UPDATE_BOT_TOKEN }}
+ push-to-fork: ci-forks/LocalAI
+ commit-message: ':arrow_up: Checksum updates in gallery/index.yaml'
+ title: 'models(gallery): :arrow_up: update checksum'
+ branch: "update/checksum"
+ body: Updating checksums in gallery/index.yaml
+ signoff: true
diff --git a/.github/workflows/generate_grpc_cache.yaml b/.github/workflows/generate_grpc_cache.yaml
@@ -84,7 +84,7 @@ jobs:
  build-args: |
  GRPC_BASE_IMAGE=${{ matrix.grpc-base-image }}
  GRPC_MAKEFLAGS=--jobs=4 --output-sync=target
- GRPC_VERSION=v1.63.0
+ GRPC_VERSION=v1.64.0
  context: .
  file: ./Dockerfile
  cache-to: type=gha,ignore-error=true

diff --git a/.github/workflows/generate_intel_image.yaml b/.github/workflows/generate_intel_image.yaml
@@ -0,0 +1,59 @@
+name: 'generate and publish intel docker caches'
+
+on:
+ workflow_dispatch:
+ push:
+ branches:
+ - master
+
+concurrency:
+ group: intel-cache-${{ github.head_ref || github.ref }}-${{ github.repository }}
+ cancel-in-progress: true
+
+jobs:
+ generate_caches:
+ strategy:
+ matrix:
+ include:
+ - base-image: intel/oneapi-basekit:2024.1.0-devel-ubuntu22.04
+ runs-on: 'ubuntu-latest'
+ platforms: 'linux/amd64'
+ runs-on: ${{matrix.runs-on}}
+ steps:
+ - name: Set up QEMU
+ uses: docker/setup-qemu-action@master
+ with:
+ platforms: all
+ - name: Login to DockerHub
+ if: github.event_name != 'pull_request'
+ uses: docker/login-action@v3
+ with:
+ username: ${{ secrets.DOCKERHUB_USERNAME }}
+ password: ${{ secrets.DOCKERHUB_PASSWORD }}
+
+ - name: Login to quay
+ if: github.event_name != 'pull_request'
+ uses: docker/login-action@v3
+ with:
+ registry: quay.io
+ username: ${{ secrets.LOCALAI_REGISTRY_USERNAME }}
+ password: ${{ secrets.LOCALAI_REGISTRY_PASSWORD }}
+ - name: Set up Docker Buildx
+ id: buildx
+ uses: docker/setup-buildx-action@master
+
+ - name: Checkout
+ uses: actions/checkout@v4
+
+ - name: Cache Intel images
+ uses: docker/build-push-action@v5
+ with:
+ builder: ${{ steps.buildx.outputs.name }}
+ build-args: |
+ BASE_IMAGE=${{ matrix.base-image }}
+ context: .
+ file: ./Dockerfile
+ tags: quay.io/go-skynet/intel-oneapi-base:latest
+ push: true
+ target: intel
+ platforms: ${{ matrix.platforms }}
diff --git a/.github/workflows/image-pr.yml b/.github/workflows/image-pr.yml
@@ -68,7 +68,7 @@ jobs:
  - build-type: 'sycl_f16'
  platforms: 'linux/amd64'
  tag-latest: 'false'
- base-image: "intel/oneapi-basekit:2024.1.0-devel-ubuntu22.04"
+ base-image: "quay.io/go-skynet/intel-oneapi-base:latest"
  grpc-base-image: "ubuntu:22.04"
  tag-suffix: 'sycl-f16-ffmpeg'
  ffmpeg: 'true'
@@ -110,7 +110,7 @@ jobs:
  - build-type: 'sycl_f16'
  platforms: 'linux/amd64'
  tag-latest: 'false'
- base-image: "intel/oneapi-basekit:2024.1.0-devel-ubuntu22.04"
+ base-image: "quay.io/go-skynet/intel-oneapi-base:latest"
  grpc-base-image: "ubuntu:22.04"
  tag-suffix: 'sycl-f16-ffmpeg-core'
  ffmpeg: 'true'

diff --git a/.github/workflows/image.yml b/.github/workflows/image.yml
@@ -148,7 +148,7 @@ jobs:
  - build-type: 'sycl_f16'
  platforms: 'linux/amd64'
  tag-latest: 'auto'
- base-image: "intel/oneapi-basekit:2024.1.0-devel-ubuntu22.04"
+ base-image: "quay.io/go-skynet/intel-oneapi-base:latest"
  grpc-base-image: "ubuntu:22.04"
  tag-suffix: '-sycl-f16-ffmpeg'
  ffmpeg: 'true'
@@ -161,7 +161,7 @@ jobs:
  - build-type: 'sycl_f32'
  platforms: 'linux/amd64'
  tag-latest: 'auto'
- base-image: "intel/oneapi-basekit:2024.1.0-devel-ubuntu22.04"
+ base-image: "quay.io/go-skynet/intel-oneapi-base:latest"
  grpc-base-image: "ubuntu:22.04"
  tag-suffix: '-sycl-f32-ffmpeg'
  ffmpeg: 'true'
@@ -175,7 +175,7 @@ jobs:
  - build-type: 'sycl_f16'
  platforms: 'linux/amd64'
  tag-latest: 'false'
- base-image: "intel/oneapi-basekit:2024.1.0-devel-ubuntu22.04"
+ base-image: "quay.io/go-skynet/intel-oneapi-base:latest"
  grpc-base-image: "ubuntu:22.04"
  tag-suffix: '-sycl-f16-core'
  ffmpeg: 'false'
@@ -185,7 +185,7 @@ jobs:
  - build-type: 'sycl_f32'
  platforms: 'linux/amd64'
  tag-latest: 'false'
- base-image: "intel/oneapi-basekit:2024.1.0-devel-ubuntu22.04"
+ base-image: "quay.io/go-skynet/intel-oneapi-base:latest"
  grpc-base-image: "ubuntu:22.04"
  tag-suffix: '-sycl-f32-core'
  ffmpeg: 'false'
@@ -195,7 +195,7 @@ jobs:
  - build-type: 'sycl_f16'
  platforms: 'linux/amd64'
  tag-latest: 'false'
- base-image: "intel/oneapi-basekit:2024.1.0-devel-ubuntu22.04"
+ base-image: "quay.io/go-skynet/intel-oneapi-base:latest"
  grpc-base-image: "ubuntu:22.04"
  tag-suffix: '-sycl-f16-ffmpeg-core'
  ffmpeg: 'true'
@@ -205,7 +205,7 @@ jobs:
  - build-type: 'sycl_f32'
  platforms: 'linux/amd64'
  tag-latest: 'false'
- base-image: "intel/oneapi-basekit:2024.1.0-devel-ubuntu22.04"
+ base-image: "quay.io/go-skynet/intel-oneapi-base:latest"
  grpc-base-image: "ubuntu:22.04"
  tag-suffix: '-sycl-f32-ffmpeg-core'
  ffmpeg: 'true'

diff --git a/.github/workflows/image_build.yml b/.github/workflows/image_build.yml
@@ -218,7 +218,7 @@ jobs:
  BASE_IMAGE=${{ inputs.base-image }}
  GRPC_BASE_IMAGE=${{ inputs.grpc-base-image || inputs.base-image }}
  GRPC_MAKEFLAGS=--jobs=4 --output-sync=target
- GRPC_VERSION=v1.63.0
+ GRPC_VERSION=v1.64.0
  MAKEFLAGS=${{ inputs.makeflags }}
  context: .
  file: ./Dockerfile