Multi step scheduling support for encoder-decoder models #12265

Closed
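This PR lands encoder-decoder support for multi-step scheduling (MSS) in the HabanaAI fork, building on the earlier MSS work visible in the commit list below (#441, #457, #501). As a rough usage sketch, and not code taken from this PR: multi-step scheduling in vLLM is driven by the upstream num_scheduler_steps engine argument, so assuming the fork keeps that interface, enabling it for an encoder-decoder model would look roughly like the following. The BART checkpoint is purely illustrative.

# Minimal sketch, not the PR's implementation. Assumes the HabanaAI fork
# exposes upstream vLLM's `num_scheduler_steps` engine argument; the model
# choice is illustrative only.
from vllm import LLM, SamplingParams

llm = LLM(
    model="facebook/bart-large-cnn",  # an encoder-decoder (BART) model
    num_scheduler_steps=8,            # values > 1 enable multi-step scheduling
)

params = SamplingParams(temperature=0.0, max_tokens=64)
outputs = llm.generate(
    ["vLLM is a high-throughput, memory-efficient inference engine."],
    params,
)
print(outputs[0].outputs[0].text)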
Changes from all commits (599 commits)
ebd42c4
Reformat README_GAUDI.md (#389)
kzawora-intel Oct 14, 2024
2d2bf7a
[CI] Prepare separate Jenkins tests for torch compile mode (#388)
anko-intel Oct 14, 2024
9df1d4a
Remove workaround added to resolve multi-card stall issue (#387)
SanjuCSudhakaran Oct 14, 2024
9777c9f
Update SynapseAI version in README & Dockerfile (#390)
kzawora-intel Oct 14, 2024
5ceda69
Merge remote-tracking branch 'origin/habana_main' into HEAD
kzawora-intel Oct 14, 2024
3e6a2d4
Merge remote-tracking branch 'upstream/main' into HEAD
kzawora-intel Oct 14, 2024
9ac52ab
fix attention backend selector:
kzawora-intel Oct 14, 2024
57bc31d
Oct 7 rebase (#367)
kzawora-intel Oct 14, 2024
55dd07e
enable mixtral quantization using INC (#372)
dudilester Oct 15, 2024
401f5ae
[CI] Temporarily increase test tolerances (#392)
kzawora-intel Oct 15, 2024
e598f3f
Add quickstart section to READMEs (#391)
kzawora-intel Oct 15, 2024
f77435d
Softmax: add weighted-sum normalization (#378)
madamczykhabana Oct 16, 2024
a59fc7b
Remove HPU changes from cache_engine.py (#400)
kzawora-intel Oct 16, 2024
05bcdf5
[bucketing overhaul 1/n] Add padding-aware scheduling and option to l…
kzawora-intel Oct 17, 2024
9276ccc
Add WA for RuntimeError: "fill_cpu" not implemented for 'Float8_e4m3f…
kzawora-intel Oct 17, 2024
07c98a5
Workaround for OOM during loading llama-405 (#396)
afierka-intel Oct 18, 2024
acde882
Add HPU specific arguments to benchmark_throughput (#406)
kdamaszk Oct 22, 2024
8c43ff1
Add forward_hpu to RotaryEmbedding, remove custom module (#404)
kzawora-intel Oct 22, 2024
aecd667
Remove if blocks smaller than bs in generate_decode_buckets (#412)
kamil-kaczor Oct 22, 2024
0cf5261
Remove CPU sync before Sampler (#414)
kdamaszk Oct 22, 2024
3af4b6c
Remove redundant set_active_loras call during warmup (#413)
SanjuCSudhakaran Oct 22, 2024
892c090
Change profile Run batch based on max_seq_len (#415)
hlahkar Oct 23, 2024
7f58ad1
Add support for various softmax normalization options (#420)
madamczykhabana Oct 23, 2024
f603353
Update README_GAUDI about fp8 calibration procedure (#423)
afierka-intel Oct 25, 2024
a5136ec
Set vllm-hpu-extension to 341a77f (#428)
madamczykhabana Oct 25, 2024
a926d14
Create scorecard.yml
rozhukov Oct 25, 2024
5b7f685
Contiguous PA (#424)
mfylcek Oct 25, 2024
e3ae2eb
Revert "Contiguous PA" (#432)
madamczykhabana Oct 25, 2024
93609a2
Enable Dynamic MoE for Mixtral on 1.19.0 (#425)
tpawlows Oct 25, 2024
3a55e77
Support long contexts with LoRA (#418)
SanjuCSudhakaran Oct 28, 2024
4fd5c4c
Add HPU specific changes to benchmark_latency.py (#436)
kdamaszk Oct 28, 2024
3e06110
Merge remote-tracking branch 'upstream/main' into HEAD
kzawora-intel Oct 28, 2024
96e0d6f
Rebase fix
kzawora-intel Oct 28, 2024
ebebbbb
fix ci fails
kzawora-intel Oct 28, 2024
4c0caa5
fix ci again
kzawora-intel Oct 28, 2024
72a2856
formatting
kzawora-intel Oct 28, 2024
2a38e6f
sarkar/Add htrandom generator for hpu (#246)
ssarkar2 Oct 28, 2024
3e135ae
Fix one_hot bug in torch compile mode (#427)
yuwenzho Oct 29, 2024
3203bd9
HPU: offload logits processing to CPU (#358)
madamczykhabana Oct 29, 2024
2fa54e2
Lora layers (#435)
rsshaik1 Oct 29, 2024
1dcdb37
initial works on enabling automatic prefix caching (#162)
huijjj Oct 29, 2024
78e947a
Multi step scheduling (#441)
tzielinski-habana Oct 29, 2024
a821717
Add fp8 test to jenkins CI (#429)
afierka-intel Oct 30, 2024
79dc102
Enable FusedSDPA prefill by default (#447)
kzawora-intel Oct 30, 2024
2f7f963
Contiguous PA (#433)
mfylcek Oct 30, 2024
94858b5
Fix default value for FSDPA (#448)
madamczykhabana Oct 30, 2024
d3257b2
Fix performance of top_p and top_k calculations (#449)
kdamaszk Oct 30, 2024
d42c2a2
Reduce block fragmentation (#426)
yangw1234 Oct 31, 2024
6643aa6
Create scorecard.yml (#431)
rozhukov Oct 31, 2024
0cc72b9
Enable HPUGraphs for lora long-contexts tests
SanjuCSudhakaran Nov 4, 2024
24ba4d4
[CI] Add Llama2 to torch compile tests (#446)
anko-intel Nov 4, 2024
1bb808a
Enable HPUGraphs for lora long-contexts tests (#454)
vivekgoe Nov 4, 2024
ac12d53
Fix SchedulerConfig params (#459)
ldurejko Nov 5, 2024
653e56c
Tensor parallelism for multi-step scheduling (#457)
tzielinski-habana Nov 5, 2024
1033c3e
Set tokenizers version to <0.20.2 (#460)
madamczykhabana Nov 5, 2024
5e56d88
Merge remote-tracking branch 'origin/habana_main' into private/kzawor…
kzawora-intel Nov 5, 2024
18f00d7
Merge remote-tracking branch 'upstream/main' into private/kzawora/oct…
kzawora-intel Nov 5, 2024
d397ba5
fix hpu execution
kzawora-intel Nov 5, 2024
4c0647f
format.sh
kzawora-intel Nov 5, 2024
c41788f
fix type checks
kzawora-intel Nov 5, 2024
c3c0e90
[BugFix][Habana_main][Multistep]Fix multistep deepcopy overhead (#452)
xuechendi Nov 6, 2024
dc5cdfb
Set vllm-hpu-extension to 0063520 (#455)
madamczykhabana Nov 6, 2024
7578f3b
Oct 28 rebase (#439)
kzawora-intel Nov 6, 2024
07a6441
Revert "Oct 28 rebase" (#466)
kzawora-intel Nov 6, 2024
5812cb6
Oct 28 rebase - attempt 2 (#467)
kzawora-intel Nov 6, 2024
40882f3
Merge commit 'a5fda50a10641e47c0c290907f30ef2add6d4e7a' into HEAD
kzawora-intel Nov 6, 2024
8e62377
format.sh
kzawora-intel Nov 6, 2024
5eb7f3d
Nov 6 rebase (sans vllm-project#6143) (#468)
kzawora-intel Nov 6, 2024
0a17a2e
Fix missed conflict (#469)
kzawora-intel Nov 6, 2024
b91403a
Merge commit 'a02a50e' into HEAD
kzawora-intel Nov 6, 2024
843ae37
Merge commit '6a585a2' into HEAD
kzawora-intel Nov 6, 2024
60b981e
Align fork with HPU upstream code (#465)
michalkuligowski Nov 6, 2024
3c39626
The output tensor from sampling is the input_tokens to the (#471)
tzielinski-habana Nov 6, 2024
11f5da6
Add multi step scheduling scenario to jenkins CI (#445)
afierka-intel Nov 7, 2024
6eed0ef
Handle offsets shape in long contexts
SanjuCSudhakaran Nov 7, 2024
e6087ea
[New Feature][Habana-Main] speculative_decoding HPU support (#375)
xuechendi Nov 7, 2024
ac16ba1
[Doc] Fix broken urls in gaudi-installation (#473)
MohitIntel Nov 8, 2024
e818cf3
[Installation] Avoid ModuleNotFoundError:setuptools-scm error (#475)
MohitIntel Nov 8, 2024
41dddab
Add option to disable duplicates in topk (#464)
kdamaszk Nov 8, 2024
1565944
Handle offsets shape in long contexts (#477)
vivekgoe Nov 11, 2024
65a920e
Merge remote-tracking branch 'upstream/main' into HEAD
kzawora-intel Nov 12, 2024
890b1f0
[New Feature][Habana main] spec decode PR2 - Medusa, MLP, Eagle (#461)
xuechendi Nov 12, 2024
3fb59c7
Add FP8 TP=2 scenario to Jenkins CI (#478)
afierka-intel Nov 13, 2024
c27899a
Commonalize code between contiguous and flat pa (#493)
madamczykhabana Nov 14, 2024
0548200
Config hidden layer number to run in 1 lazy graph (#451)
libinta Nov 14, 2024
eca9a83
Fix number of blocks when profiling contiguous pa (#496)
madamczykhabana Nov 14, 2024
ea8a23a
Warmup for multi-step scheduling (#501)
tzielinski-habana Nov 15, 2024
a029232
Enable patching matmuls in block2batch and batch2block (#500)
nirda7 Nov 15, 2024
875faa6
Add FP8 inference procedure (#504)
afierka-intel Nov 15, 2024
0467cc1
Warm up random sampler
mfylcek Nov 14, 2024
82e0521
Warmup random sampler only during decoding
mfylcek Nov 15, 2024
0014d34
Remove comment
mfylcek Nov 15, 2024
e0e37e0
Remove comments
mfylcek Nov 15, 2024
96467d8
Terminate ray workers on ray_hpu_executor shutdown (#505)
kzawora-intel Nov 15, 2024
0175fe0
Formatting
mfylcek Nov 15, 2024
b38b160
Move the warmup to graph capture function
mfylcek Nov 15, 2024
76aa48a
Bug fix
mfylcek Nov 15, 2024
e24a5af
Formatting
mfylcek Nov 15, 2024
0011e75
Add valid_seq_lengths to fusedsdpa - port from 1.18.0 (#509)
iboiko-habana Nov 18, 2024
c601886
Set vllm-hpu-extension to 2542c18 (#517)
iboiko-habana Nov 18, 2024
dac5d80
[BUGFIX] fix worker selector non-return issue (#508)
xuechendi Nov 18, 2024
a4e689a
Use contiguous pa by default (#519)
madamczykhabana Nov 18, 2024
fb308c9
Set vllm-hpu-extension to 3a60b49 (#520)
madamczykhabana Nov 18, 2024
9ebcb9b
Merge remote-tracking branch 'origin/habana_main' into HEAD
kzawora-intel Nov 18, 2024
295cabe
Merge remote-tracking branch 'upstream/main' into HEAD
kzawora-intel Nov 18, 2024
7c5038c
Add async copying to input preparation (#497)
jkaniecki Nov 18, 2024
8155ba7
Merge remote-tracking branch 'origin/habana_main' into HEAD
kzawora-intel Nov 18, 2024
3400180
format.sh
kzawora-intel Nov 18, 2024
6ae5229
Nov 18 rebase (#485)
kzawora-intel Nov 18, 2024
c79982d
[BUGFIX]fix FP8 failing issue on habana_main [PatchedVLLMKVCache fwd …
xuechendi Nov 18, 2024
2f43ebf
Set vllm-hpu-extension to a69bb99 (#521)
madamczykhabana Nov 19, 2024
8c3f56a
Update ray_hpu_executor.py (#522)
michalkuligowski Nov 20, 2024
6338608
Random sampler warmup (#506)
mfylcek Nov 20, 2024
efe0268
Skip empty steps in multi step sheduling (#526)
jkaniecki Nov 20, 2024
f481707
[bucketing overhaul 2/n] Delegate bucket management to HPUBucketingCo…
kdamaszk Nov 21, 2024
425d0be
[SW-201504] Adding Test Trigger (#533)
RonBenMosheHabana Nov 21, 2024
0d153cf
[SW-201504] Add Jenkins Tests Trigger (#537)
RonBenMosheHabana Nov 22, 2024
dbde4b8
[bucketing overhaul 3/n] Move HPUBucketingContext to vllm-hpu-extensi…
kdamaszk Nov 22, 2024
39c6b6c
Limit decode block size (#532)
mfylcek Nov 25, 2024
5eb8b1f
fix marlin flag set on hpu (#540)
nirda7 Nov 25, 2024
0f513bd
Fix profile run for multi LoRA (#549)
kdamaszk Nov 26, 2024
7133502
fix cutlass_fp8_supported flag set on hpu
nirda7 Nov 26, 2024
38c2d10
Fix cutlass_fp8_supported flag set on HPU (#550)
nirda7 Nov 26, 2024
b62f1b2
[HPU] Add mark_step configurable for the decoder layer. (#525)
jiminha Nov 26, 2024
633df59
Update cpu-test.yml (#544)
michalkuligowski Nov 26, 2024
4d8185f
Update *.sh (#545)
michalkuligowski Nov 26, 2024
3f0b0e4
Update run-lm-eval-gsm-vllm-baseline.sh (#552)
michalkuligowski Nov 26, 2024
b099337
Add HPU information to collect_env script (#430)
michalkuligowski Nov 26, 2024
b7d75b8
Intern2 habana (#489)
skirdey-inflection Nov 26, 2024
677741e
Added hpu as device argument
rsshaik1 Nov 26, 2024
0c62b0b
Added "hpu" as configurable device argument in test_lora_manager_hpu …
vivekgoe Nov 27, 2024
756485f
[BUG FIX] [SPEC DECODE] 0.6.4 rebase cause incorrectness in spec deco…
xuechendi Nov 28, 2024
d83b62f
CI fix (#563)
tzielinski-habana Nov 28, 2024
637bb57
Set vllm-hpu-extension to 50e10ea (#565)
mswiniarsk Nov 28, 2024
cff5c7f
Refactor FP8 Inc config and flow (#564)
nirda7 Nov 29, 2024
f295f07
Set vllm-hpu-extension to bc01901
iboiko-habana Nov 29, 2024
2aeea0b
Set vllm-hpu-extension to bc01901 (#567)
iboiko-habana Nov 29, 2024
cef2df0
to make repetition penalty faster (#442)
ccrhx4 Nov 29, 2024
49c9efa
Enable alibi fusedsdpa (#561)
itaraban Nov 29, 2024
56da9fc
Merge remote-tracking branch 'upstream/main' into HEAD
kzawora-intel Dec 2, 2024
e438503
fix syntax error
kzawora-intel Dec 2, 2024
4b502a6
Set vllm-hpu-extension to fb36408 (#572)
mswiniarsk Dec 2, 2024
3cb5420
Set vllm-hpu-extension to cd520df (#574)
mswiniarsk Dec 3, 2024
1440f45
Revert "to make repetition penalty faster" (#570)
michalkuligowski Dec 3, 2024
b9d6f69
Regional compilation support (#576)
Kacper-Pietkun Dec 4, 2024
4796d16
Revert "Enable alibi fusedsdpa" (#585)
madamczykhabana Dec 4, 2024
8c76728
Prepare sin/cos buffers for rope outside model forward (#566)
tzielinski-habana Dec 4, 2024
f6865f4
Enable DeepseekV2 Lite/Chat models (#516)
hlin99 Dec 4, 2024
8754e17
Set vllm-hpu-extension to 070591a (#591)
mswiniarsk Dec 4, 2024
ad29332
[CI/BUILD] Spec decode ci (#524)
xuechendi Dec 5, 2024
a805205
Add host traces to high-level profilings (#577)
szutenberg Dec 6, 2024
e349f70
Enable patching Fused SDPA (#569)
nirda7 Dec 6, 2024
6a4f673
revert INC fixed version installation in requirements-hpu.txt for 1.1…
xuechendi Dec 6, 2024
e0e47ed
Add multiprocessing HPU executor (#559)
kzawora-intel Dec 6, 2024
858e0a0
fix WorkerWrapperBase and spec_decode rebase (#582)
xuechendi Dec 6, 2024
21323ed
Merge remote-tracking branch 'origin/habana_main' into HEAD
kzawora-intel Dec 6, 2024
d8f395e
Merge remote-tracking branch 'upstream/main' into HEAD
kzawora-intel Dec 6, 2024
48ab12b
fix mypy errors
kzawora-intel Dec 6, 2024
9204975
fix (hopefully) all linter errors
kzawora-intel Dec 6, 2024
ad8d5b7
Dec 06 rebase (#571)
kzawora-intel Dec 9, 2024
db68690
fix hpu destructors flow and remove finish_measurements (#379)
nirda7 Dec 9, 2024
0cce63a
Set vllm-hpu-extension to 4312768
SanjuCSudhakaran Dec 10, 2024
3473bc1
Set vllm-hpu-extension to 4312768 (#604)
vivekgoe Dec 10, 2024
239739c
Support mllama (llama 3.2) model for HPU (#491)
yisonzhu Dec 10, 2024
2126fd2
Merge remote-tracking branch 'upstream/main' into HEAD
kzawora-intel Dec 10, 2024
89266bc
Merge remote-tracking branch 'origin/habana_main' into private/kzawor…
kzawora-intel Dec 10, 2024
5a166da
Update ray_hpu_executor.py
michalkuligowski Dec 10, 2024
0ad9b59
Enable padding aware scheduling by default on HPU (#606)
kzawora-intel Dec 10, 2024
17e6be7
Update CODEOWNERS
kzawora-intel Dec 10, 2024
15774c4
Update CODEOWNERS (#608)
kzawora-intel Dec 10, 2024
def7ac2
Fix TP>1 in encoder-decoder models (#607)
jkaniecki Dec 10, 2024
b8fff21
Add PunicaWrapperHPU to handle LoRA computations
SanjuCSudhakaran Dec 11, 2024
381453c
Align LoRA handling in HPU with PunicaWrapper class (#614)
kzawora-intel Dec 11, 2024
a9fde5f
Dec 10 rebase (#605)
michalkuligowski Dec 11, 2024
641367b
Revert "Dec 10 rebase"
michalkuligowski Dec 11, 2024
55f99ea
Revert "Dec 10 rebase" (#618)
kzawora-intel Dec 11, 2024
ad10b73
Revert "Revert "Dec 10 rebase""
kzawora-intel Dec 11, 2024
df7dd05
Revert "Revert "Dec 10 rebase"" (#619)
kzawora-intel Dec 11, 2024
07dbd34
fix graceful shutdown
kzawora-intel Dec 10, 2024
d312c92
Fix multiprocessing executor shutdown (#621)
michalkuligowski Dec 11, 2024
7ef6b2c
Update GitHub Actions targets (#622)
kzawora-intel Dec 11, 2024
449a89d
Add padding to encoder_seq_lens (#610)
kdamaszk Dec 12, 2024
d2128b4
Remove workaround for one_hot in eager/compile (#632)
anko-intel Dec 16, 2024
11c07e3
Add shutdown_inc method to MultiprocessingHPUExecutor (#634)
nirda7 Dec 16, 2024
ba1d24b
Fix recompilations due to different batch_sizes in MSS (#637)
mfylcek Dec 16, 2024
c9a740f
Fix CI reports (#636)
afierka-intel Dec 16, 2024
da61ecf
Unit scales in FP8 CI scenarios (#633)
afierka-intel Dec 16, 2024
adac58e
multimodality fix
adobrzyniewicz-habana Dec 17, 2024
e8ce81e
formating
adobrzyniewicz-habana Dec 17, 2024
d81f829
TC llama recompile fix - no_grad to inference_mode (#640)
RafLit Dec 18, 2024
88ef381
Generic call for prepare_cos_sin in rotary embedding (#638)
tzielinski-habana Dec 18, 2024
67df809
undo changes in layer.py
adobrzyniewicz-habana Dec 18, 2024
0fdac85
Merge branch 'habana_main' into adobrzyniewicz/multimodality_for_llava
adobrzyniewicz-habana Dec 18, 2024
9555fef
Update CODEOWNERS (#649)
vivekgoe Dec 19, 2024
1259d8d
remove past code
adobrzyniewicz-habana Dec 20, 2024
5c59ccd
Merge branch 'habana_main' into adobrzyniewicz/multimodality_for_llava
adobrzyniewicz-habana Dec 30, 2024
2443ba9
Fix long contexts in LoRA (#624)
SanjuCSudhakaran Jan 2, 2025
2012336
Lora manager tests fix (#652)
rsshaik1 Jan 2, 2025
5b5bf26
Fix LoRA tests (#664)
SanjuCSudhakaran Jan 2, 2025
2d24be7
[BUG fix] Rebase caused spec decode fix (#613)
xuechendi Jan 7, 2025
27a22ab
fix slow sampling when repetition_penalty is set. (#584)
ccrhx4 Jan 7, 2025
9d6917f
Optimize for topk=1 case if we do not handle duplicates (#603)
ssarkar2 Jan 7, 2025
5d582b5
[bugfix] fix RuntimeError on apc (#648)
kkimmk Jan 7, 2025
585ca9a
Add llava support to benchmark_throuhput (#665)
adobrzyniewicz-habana Jan 8, 2025
8f53dee
Add mllama support to benchmark_throughput (#668)
kdamaszk Jan 8, 2025
49a11e2
Add mark_step for encoder layers (#669)
yma11 Jan 8, 2025
cccf363
Use FusedSDPA for MllamaVisionSdpaAttention (#620)
kdamaszk Jan 8, 2025
fa9dbf2
Limit number of dummy cross attention blocks (#667)
kdamaszk Jan 8, 2025
cbfb022
send placeholder_index_maps
adobrzyniewicz-habana Jan 9, 2025
73aaf71
[SW-197036] - use torch._scaled_mm with hpu (#660)
nirda7 Jan 9, 2025
e411a64
Merge remote-tracking branch 'upstream/main' into HEAD
kzawora-intel Jan 10, 2025
ab1ca6d
make the code actually run
kzawora-intel Jan 10, 2025
f3ecf00
make linters happy
kzawora-intel Jan 10, 2025
c5975f8
Handle LoRA specific changes in MSS (#675)
SanjuCSudhakaran Jan 11, 2025
c83289e
[SW-201504] Trigger Internal Tests (#538)
RonBenMosheHabana Jan 12, 2025
c245ef0
Fix model OOM issue in llama-405 and mixtral - 2nd attempt (#644)
afierka-intel Jan 13, 2025
eb0d42f
Add inc fp8 qunatization documentation (#635)
nirda7 Jan 13, 2025
f6b6092
Adds LoRA tests to vLLM CI pipeline (#680)
rsshaik1 Jan 14, 2025
132d40e
Update CODEOWNERS (#683)
michalkuligowski Jan 14, 2025
f51e265
Merge remote-tracking branch 'upstream/main' into private/kzawora/jan…
kzawora-intel Jan 14, 2025
ca8cb82
Merge remote-tracking branch 'origin/habana_main' into private/kzawor…
kzawora-intel Jan 14, 2025
7d13823
linter updates + bugfixes
kzawora-intel Jan 14, 2025
885c60d
Set vllm-hpu-extension to 6ac93fb (#684)
mfylcek Jan 15, 2025
aeebe54
Set cache size for t.compile even if there is no warmup (#689)
anko-intel Jan 15, 2025
47391dc
Jan 10 rebase (#677)
kzawora-intel Jan 15, 2025
9af82cd
Workaround to handle multi-card stall issue (#688)
SanjuCSudhakaran Jan 16, 2025
567f7e7
Merge branch 'habana_main' into adobrzyniewicz/multimodality_for_llava
adobrzyniewicz-habana Jan 16, 2025
40bb71f
Fix weights load device use (#686)
nirda7 Jan 16, 2025
aaaac6c
format
adobrzyniewicz-habana Jan 16, 2025
a3197c6
Merge branch 'habana_main' into adobrzyniewicz/multimodality_for_llava
adobrzyniewicz-habana Jan 16, 2025
b3a0db2
Move scores to float32 in case of running xgrammar on cpu (#695)
madamczykhabana Jan 16, 2025
4db525d
Clean-up LoRA flow (#518)
SanjuCSudhakaran Jan 17, 2025
2d85682
Merge branch 'habana_main' into adobrzyniewicz/multimodality_for_llava
adobrzyniewicz-habana Jan 17, 2025
a685225
Check if kv_cache is tuple before calling split_kv_cache (#697)
kdamaszk Jan 17, 2025
a293e2e
Merge branch 'habana_main' into adobrzyniewicz/multimodality_for_llava
adobrzyniewicz-habana Jan 17, 2025
7eea2df
[CI] Cleanup run_tests.sh logs (#700)
kzawora-intel Jan 17, 2025
ce50b1a
Merge remote-tracking branch 'upstream/main' into private/kzawora/reb…
kzawora-intel Jan 17, 2025
a128878
fix TP crashes
kzawora-intel Jan 17, 2025
2e53e75
make mypy happy
kzawora-intel Jan 17, 2025
21f5fb2
¿what the heck is incquark?
kzawora-intel Jan 17, 2025
f1e911d
i forgot brackets again
kzawora-intel Jan 17, 2025
ae67e4d
Multimodality fix for llava (#641)
adobrzyniewicz-habana Jan 17, 2025
018ce62
Rebase 2025-01-17 (#701)
kzawora-intel Jan 17, 2025
b10992b
Fix LoRA tests (#696)
SanjuCSudhakaran Jan 20, 2025
1252646
Updating README_GAUDI in habana_main (#690)
MohitIntel Jan 20, 2025
293bd87
Change vllm-hpu-extension revision to ae726d4
iboiko-habana Jan 20, 2025
cc069cb
Change vllm-hpu-extension revision to ae726d4 (#707)
iboiko-habana Jan 20, 2025
fedf706
Capabilities overhaul (#692)
madamczykhabana Jan 20, 2025
37eb4fc
[SW-216156] Fix mixtral Fused MoE issues after rebase (#708)
dudilester Jan 21, 2025
ed496d6
Support for multi step scheduling in enc dec models
jkaniecki Jan 21, 2025
Files changed
31 changes: 1 addition & 30 deletions .github/CODEOWNERS
@@ -1,33 +1,4 @@
# See https://help.github.com/articles/about-codeowners/
# for more info about CODEOWNERS file

# This lists cover the "core" components of vLLM that require careful review
/vllm/attention/backends/abstract.py @WoosukKwon @zhuohan123 @youkaichao @alexm-neuralmagic @comaniac @njhill
/vllm/core @zhuohan123 @youkaichao @alexm-neuralmagic @comaniac @njhill
/vllm/engine/llm_engine.py @zhuohan123 @youkaichao @alexm-neuralmagic @comaniac @njhill
/vllm/executor/executor_base.py @zhuohan123 @youkaichao @alexm-neuralmagic @comaniac @njhill
/vllm/worker/worker_base.py @zhuohan123 @youkaichao @alexm-neuralmagic @comaniac @njhill
/vllm/worker/worker.py @zhuohan123 @youkaichao @alexm-neuralmagic @comaniac @njhill
/vllm/model_executor/layers/sampler.py @zhuohan123 @youkaichao @alexm-neuralmagic @comaniac @njhill
CMakeLists.txt @tlrmchlsmth

# vLLM V1
/vllm/v1 @WoosukKwon @robertgshaw2-neuralmagic @njhill @ywang96 @comaniac @alexm-neuralmagic

# Test ownership
/tests/async_engine @njhill @robertgshaw2-neuralmagic @simon-mo
/tests/test_inputs.py @DarkLight1337 @ywang96
/tests/entrypoints @DarkLight1337 @robertgshaw2-neuralmagic @simon-mo
/tests/models @DarkLight1337 @ywang96
/tests/multimodal @DarkLight1337 @ywang96
/tests/prefix_caching @comaniac @KuntaiDu
/tests/spec_decode @njhill @LiuXiaoxuanPKU
/tests/kernels @tlrmchlsmth @WoosukKwon
/tests/quantization @mgoin @robertgshaw2-neuralmagic
/.buildkite/lm-eval-harness @mgoin @simon-mo
/tests/distributed/test_multi_node_assignment.py @youkaichao
/tests/distributed/test_pipeline_parallel.py @youkaichao
/tests/distributed/test_same_node.py @youkaichao
/tests/multi_step @alexm-neuralmagic @comaniac
/tests/weight_loading @mgoin @youkaichao
/tests/basic_correctness/test_chunked_prefill @rkooo567 @comaniac
* @kzawora-intel @madamczykhabana @michalkuligowski @mgawarkiewicz @vivekgoe @afierka-intel
10 changes: 10 additions & 0 deletions .github/actionlint.yaml
@@ -0,0 +1,10 @@
self-hosted-runner:
# Labels of self-hosted runner in array of strings.
labels:
- generic-runner
paths:
.github/workflows/trigger_jenkins.yml:
ignore:
- shellcheck reported issue in this script: SC2116:.+
- shellcheck reported issue in this script: SC2086:.+
- shellcheck reported issue in this script: SC2001:.+
4 changes: 2 additions & 2 deletions .github/workflows/actionlint.yml
@@ -2,14 +2,14 @@ name: Lint GitHub Actions workflows
on:
push:
branches:
- "main"
- "habana_main"
paths:
- '.github/workflows/*.ya?ml'
- '.github/workflows/actionlint.*'
- '.github/workflows/matchers/actionlint.json'
pull_request:
branches:
- "main"
- "habana_main"
paths:
- '.github/workflows/*.ya?ml'
- '.github/workflows/actionlint.*'
6 changes: 3 additions & 3 deletions .github/workflows/clang-format.yml
@@ -2,10 +2,10 @@ name: clang-format

on:
# Trigger the workflow on push or pull request,
# but only for the main branch
# but only for the habana_main branch
push:
branches:
- main
- habana_main
paths:
- '**/*.h'
- '**/*.cpp'
@@ -14,7 +14,7 @@ on:
- '.github/workflows/clang-format.yml'
pull_request:
branches:
- main
- habana_main
paths:
- '**/*.h'
- '**/*.cpp'
4 changes: 2 additions & 2 deletions .github/workflows/codespell.yml
@@ -5,7 +5,7 @@ on:
# but only for the main branch
push:
branches:
- main
- habana_main
paths:
- "**/*.py"
- "**/*.md"
@@ -15,7 +15,7 @@ on:
- .github/workflows/codespell.yml
pull_request:
branches:
- main
- habana_main
paths:
- "**/*.py"
- "**/*.md"
35 changes: 35 additions & 0 deletions .github/workflows/cpu-test.yml
@@ -0,0 +1,35 @@
name: cpu-test

on:
# Trigger the workflow on push or pull request,
# but only for the habana_main branch
push:
branches:
- habana_main
pull_request:
branches:
- habana_main


jobs:
cputest:
runs-on: ubuntu-latest
strategy:
matrix:
python-version: ["3.11"]
steps:
- uses: actions/checkout@v3
- name: Set up Python ${{ matrix.python-version }}
uses: actions/setup-python@v3
with:
python-version: ${{ matrix.python-version }}
- name: Install dependencies
run: |
python -m pip install --upgrade pip
pip install torch --extra-index-url https://download.pytorch.org/whl/cpu
pip install -r requirements-build.txt
pip install -r requirements-hpu.txt
VLLM_TARGET_DEVICE=hpu python setup.py develop
- name: cpu-test
run: |
VLLM_SKIP_WARMUP=true VLLM_PROMPT_SEQ_BUCKET_MAX=128 VLLM_USE_FAKE_HPU=1 python examples/offline_inference_fakehpu.py
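A note on this new cpu-test job: it builds the HPU target on a plain Ubuntu runner and then runs examples/offline_inference_fakehpu.py with VLLM_USE_FAKE_HPU=1, which, judging by the script name and the absence of Gaudi hardware on ubuntu-latest, stubs out the HPU device so the fork can be smoke-tested on CPU. VLLM_SKIP_WARMUP=true and VLLM_PROMPT_SEQ_BUCKET_MAX=128 keep the run short, and the same one-liner should be reproducible locally after the VLLM_TARGET_DEVICE=hpu python setup.py develop step shown above.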
4 changes: 2 additions & 2 deletions .github/workflows/doc-lint.yml
@@ -3,12 +3,12 @@ name: Lint documentation
on:
push:
branches:
- main
- habana_main
paths:
- "docs/**"
pull_request:
branches:
- main
- habana_main
paths:
- "docs/**"

82 changes: 0 additions & 82 deletions .github/workflows/lint-and-deploy.yaml

This file was deleted.

6 changes: 3 additions & 3 deletions .github/workflows/mypy.yaml
@@ -2,18 +2,18 @@ name: mypy

on:
# Trigger the workflow on push or pull request,
# but only for the main branch
# but only for the habana_main branch
push:
branches:
- main
- habana_main
paths:
- '**/*.py'
- '.github/workflows/mypy.yaml'
- 'tools/mypy.sh'
- 'pyproject.toml'
pull_request:
branches:
- main
- habana_main
# This workflow is only relevant when one of the following files changes.
# However, we have github configured to expect and require this workflow
# to run and pass before github with auto-merge a pull request. Until github
4 changes: 2 additions & 2 deletions .github/workflows/png-lint.yml
@@ -2,13 +2,13 @@ name: Lint PNG exports from excalidraw
on:
push:
branches:
- "main"
- "habana_main"
paths:
- '*.excalidraw.png'
- '.github/workflows/png-lint.yml'
pull_request:
branches:
- "main"
- "habana_main"
paths:
- '*.excalidraw.png'
- '.github/workflows/png-lint.yml'
21 changes: 0 additions & 21 deletions .github/workflows/reminder_comment.yml

This file was deleted.

6 changes: 3 additions & 3 deletions .github/workflows/ruff.yml
@@ -2,10 +2,10 @@ name: ruff

on:
# Trigger the workflow on push or pull request,
# but only for the main branch
# but only for the habana_main branch
push:
branches:
- main
- habana_main
paths:
- "**/*.py"
- pyproject.toml
@@ -14,7 +14,7 @@ on:
- .github/workflows/ruff.yml
pull_request:
branches:
- main
- habana_main
# This workflow is only relevant when one of the following files changes.
# However, we have github configured to expect and require this workflow
# to run and pass before github with auto-merge a pull request. Until github
73 changes: 73 additions & 0 deletions .github/workflows/scorecard.yml
@@ -0,0 +1,73 @@
# This workflow uses actions that are not certified by GitHub. They are provided
# by a third-party and are governed by separate terms of service, privacy
# policy, and support documentation.

name: Scorecard supply-chain security
on:
# For Branch-Protection check. Only the default branch is supported. See
# https://github.com/ossf/scorecard/blob/main/docs/checks.md#branch-protection
branch_protection_rule:
# To guarantee Maintained check is occasionally updated. See
# https://github.com/ossf/scorecard/blob/main/docs/checks.md#maintained
schedule:
- cron: '20 13 * * 0'
push:
branches: [ "habana_main" ]

# Declare default permissions as read only.
permissions: read-all

jobs:
analysis:
name: Scorecard analysis
runs-on: ubuntu-latest
permissions:
# Needed to upload the results to code-scanning dashboard.
security-events: write
# Needed to publish results and get a badge (see publish_results below).
id-token: write
# Uncomment the permissions below if installing in a private repository.
# contents: read
# actions: read

steps:
- name: "Checkout code"
uses: actions/checkout@b4ffde65f46336ab88eb53be808477a3936bae11 # v4.1.1
with:
persist-credentials: false

- name: "Run analysis"
uses: ossf/scorecard-action@0864cf19026789058feabb7e87baa5f140aac736 # v2.3.1
with:
results_file: results.sarif
results_format: sarif
# (Optional) "write" PAT token. Uncomment the `repo_token` line below if:
# - you want to enable the Branch-Protection check on a *public* repository, or
# - you are installing Scorecard on a *private* repository
# To create the PAT, follow the steps in https://github.com/ossf/scorecard-action?tab=readme-ov-file#authentication-with-fine-grained-pat-optional.
# repo_token: ${{ secrets.SCORECARD_TOKEN }}

# Public repositories:
# - Publish results to OpenSSF REST API for easy access by consumers
# - Allows the repository to include the Scorecard badge.
# - See https://github.com/ossf/scorecard-action#publishing-results.
# For private repositories:
# - `publish_results` will always be set to `false`, regardless
# of the value entered here.
publish_results: false

# Upload the results as artifacts (optional). Commenting out will disable uploads of run results in SARIF
# format to the repository Actions tab.
- name: "Upload artifact"
uses: actions/upload-artifact@97a0fba1372883ab732affbe8f94b823f91727db # v3.pre.node20
with:
name: SARIF file
path: results.sarif
retention-days: 5

# Upload the results to GitHub's code scanning dashboard (optional).
# Commenting out will disable upload of results to your repo's Code Scanning dashboard
- name: "Upload to code-scanning"
uses: github/codeql-action/upload-sarif@v3
with:
sarif_file: results.sarif