mirror of
https://github.com/bentoml/OpenLLM.git
synced 2026-05-18 21:54:11 -04:00
perf: build quantization and better transformer behaviour (#28)
Fixes quantization_config and low_cpu_mem_usage to be available on the PyTorch implementation only. See the changelog for more details on #28.
This commit is contained in:
16
.github/workflows/ci.yml
vendored
16
.github/workflows/ci.yml
vendored
@@ -28,22 +28,6 @@ defaults:
|
||||
run:
|
||||
shell: bash --noprofile --norc -exo pipefail {0}
|
||||
jobs:
|
||||
codestyle_check:
|
||||
runs-on: ubuntu-latest
|
||||
if: ${{ github.event_name == 'pull_request' || github.event_name == 'push' }}
|
||||
steps:
|
||||
- uses: actions/checkout@v3
|
||||
with:
|
||||
fetch-depth: 0
|
||||
- name: Setup CI
|
||||
uses: ./.github/actions/setup-repo
|
||||
- name: Running changelog check
|
||||
run: hatch run changelog
|
||||
- name: Format and lint check
|
||||
run: hatch run fmt
|
||||
- name: Type check
|
||||
if: ${{ github.event_name == 'pull_request' }}
|
||||
run: git diff --name-only --diff-filter=AM "origin/$GITHUB_BASE_REF" -z -- '*.py{,i}' | xargs -0 --no-run-if-empty hatch run dev:typing
|
||||
tests:
|
||||
runs-on: ubuntu-latest
|
||||
if: ${{ github.event_name == 'pull_request' || github.event_name == 'push' }}
|
||||
|
||||
Reference in New Issue
Block a user