Skip to content

Commit

Permalink
remove fastertransformer build and release in DJLServing (#1241)
Browse files Browse the repository at this point in the history
  • Loading branch information
Qing Lan authored Oct 31, 2023
1 parent 6d982f4 commit 0995b65
Show file tree
Hide file tree
Showing 20 changed files with 14 additions and 1,024 deletions.
2 changes: 1 addition & 1 deletion .github/workflows/docker-nightly-publish.yml
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@ jobs:
runs-on: ubuntu-latest
strategy:
matrix:
- arch: [ cpu, cpu-full, pytorch-inf2, pytorch-cu118, fastertransformer, tensorrt-llm ]
+ arch: [ cpu, cpu-full, pytorch-inf2, pytorch-cu118, tensorrt-llm ]
steps:
- name: Clean disk space
run: |
Expand Down
346 changes: 3 additions & 343 deletions .github/workflows/llm_integration.yml

Large diffs are not rendered by default.

14 changes: 0 additions & 14 deletions .github/workflows/sagemaker-integration.yml
Original file line number Diff line number Diff line change
Expand Up @@ -98,13 +98,6 @@ jobs:
python3 llm/sagemaker-endpoint-tests.py opt-1-3-b djl ${{ github.event.inputs.mode || 'nightly' }}
echo "sleep 30 seconds to allow endpoint deletion"
sleep 30
- - name: Test flan-t5-xxl
- if: success() || failure()
- working-directory: tests/integration
- run: |
- python3 llm/sagemaker-endpoint-tests.py flan-t5-xxl djl ${{ github.event.inputs.mode || 'nightly' }}
- echo "sleep 30 seconds to allow endpoint deletion"
- sleep 30
endpoint-tests-group-2:
runs-on: [ self-hosted, cpu ]
Expand Down Expand Up @@ -142,13 +135,6 @@ jobs:
python3 llm/sagemaker-endpoint-tests.py gpt-neo-2-7-b no_code ${{ github.event.inputs.mode || 'nightly' }}
echo "sleep 30 seconds to allow endpoint deletion"
sleep 30
- - name: Test bloom-7b1 no code FasterTransformer
- if: success() || failure()
- working-directory: tests/integration
- run: |
- python3 llm/sagemaker-endpoint-tests.py bloom-7b1 no_code ${{ github.event.inputs.mode || 'nightly' }}
- echo "sleep 30 seconds to allow endpoint deletion"
- sleep 30
- name: Test DeepSpeed pythia-12b
if: success() || failure()
working-directory: tests/integration
Expand Down
218 changes: 0 additions & 218 deletions engines/python/setup/djl_python/fastertransformer.py

This file was deleted.

Original file line number Diff line number Diff line change
Expand Up @@ -34,16 +34,6 @@ public int getEngineRank() {
return PyEngine.RANK + 1;
}

- /** {@code FtEngineProvider} is the alias of {@link MpiEngineProvider}. */
- public static final class FtEngineProvider extends MpiEngineProvider {
-
- /** {@inheritDoc} */
- @Override
- public String getEngineName() {
- return "FasterTransformer";
- }
- }
-
/** {@code DsEngineProvider} is the alias of {@link MpiEngineProvider}. */
public static final class DsEngineProvider extends MpiEngineProvider {

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -160,8 +160,6 @@ public void load(Path modelPath, String prefix, Map<String, ?> options) throws I
entryPoint = modelFile.toFile().getName();
} else if ("DeepSpeed".equals(engineName)) {
entryPoint = "djl_python.deepspeed";
- } else if ("FasterTransformer".equals(engineName)) {
- entryPoint = "djl_python.fastertransformer";
} else if ("nc".equals(manager.getDevice().getDeviceType())
&& pyEnv.getTensorParallelDegree() > 0) {
entryPoint = "djl_python.transformers_neuronx";
Expand Down
Original file line number Diff line number Diff line change
@@ -1,4 +1,3 @@
ai.djl.python.engine.PyEngineProvider
ai.djl.python.engine.MpiEngineProvider
- ai.djl.python.engine.MpiEngineProvider$FtEngineProvider
ai.djl.python.engine.MpiEngineProvider$DsEngineProvider
5 changes: 0 additions & 5 deletions serving/docker/docker-compose.yml
Original file line number Diff line number Diff line change
Expand Up @@ -28,11 +28,6 @@ services:
target: base
dockerfile: pytorch-cu118.Dockerfile
image: "deepjavalibrary/djl-serving:${RELEASE_VERSION}pytorch-cu118${NIGHTLY}"
- fastertransformer:
- build:
- context: .
- dockerfile: fastertransformer.Dockerfile
- image: "deepjavalibrary/djl-serving:${RELEASE_VERSION}fastertransformer${NIGHTLY}"
tensorrt-llm:
build:
context: .
Expand Down
Loading

0 comments on commit 0995b65

Please sign in to comment.