Skip to content
This repository has been archived by the owner on Oct 25, 2024. It is now read-only.

add FP8Config

add FP8Config #4581

Workflow file for this run

# Entry-point workflow for the chatbot tests: defines when the run is
# triggered; the actual work is delegated to the reusable workflows under `jobs`.
name: Chat Bot Test

on:
  pull_request:
    # Only pull requests that target `main` trigger this workflow.
    branches:
      - main
    # Run only when a changed file matches one of these patterns.
    # Patterns are evaluated in order, so the `!` exclusions must stay
    # after the positive patterns they are meant to carve out.
    paths:
      # Workflow definitions and their helper scripts / sample data.
      - '.github/workflows/chatbot-test.yml'
      - '.github/workflows/chatbot-inference-llama-2-7b-chat-hf.yml'
      - '.github/workflows/chatbot-inference-mpt-7b-chat.yml'
      - '.github/workflows/chatbot-finetune-mpt-7b-chat.yml'
      - '.github/workflows/chatbot-inference-llama-2-7b-chat-hf-hpu.yml'
      - '.github/workflows/chatbot-inference-mpt-7b-chat-hpu.yml'
      - '.github/workflows/chatbot-finetune-mpt-7b-chat-hpu.yml'
      - '.github/workflows/script/chatbot/**'
      - '.github/workflows/sample_data/**'
      # Source trees exercised by the chatbot tests.
      # NOTE(review): the `transformers/**` pattern below already covers the
      # two narrower `transformers/llm/...` entries; they are kept as-is.
      - 'intel_extension_for_transformers/neural_chat/**'
      - 'intel_extension_for_transformers/transformers/llm/finetuning/**'
      - 'intel_extension_for_transformers/transformers/llm/quantization/**'
      - 'intel_extension_for_transformers/transformers/**'
      - 'workflows/chatbot/inference/**'
      - 'workflows/chatbot/fine_tuning/**'
      # Exclusions: changes limited to these neural_chat paths do not
      # trigger a run.
      - '!intel_extension_for_transformers/neural_chat/docs/**'
      - '!intel_extension_for_transformers/neural_chat/tests/ci/**'
      - '!intel_extension_for_transformers/neural_chat/examples/**'
      - '!intel_extension_for_transformers/neural_chat/assets/**'
      - '!intel_extension_for_transformers/neural_chat/README.md'
  # Also allow the workflow to be started manually.
  workflow_dispatch:
# If there is a new commit, the previous jobs will be canceled.
# Runs are grouped per workflow and per pull request; for events without a
# pull request (e.g. a manual dispatch) the group falls back to the git ref.
concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true
# Each job delegates to a reusable workflow stored in this repository.
jobs:
  call-inference-llama-2-7b-chat-hf:
    uses: ./.github/workflows/chatbot-inference-llama-2-7b-chat-hf.yml

  call-inference-mpt-7b-chat:
    uses: ./.github/workflows/chatbot-inference-mpt-7b-chat.yml

  # The HPU jobs below are currently disabled (commented out).
  # NOTE(review): the llama HPU job references
  # `chatbot-inference-llama-2-7b_70b-chat-hf-hpu.yml`, whereas the `paths`
  # filter of this workflow lists `chatbot-inference-llama-2-7b-chat-hf-hpu.yml`
  # - confirm which file name is correct before re-enabling.
  #
  # call-inference-llama-2-7b-chat-hf-hpu:
  #   uses: ./.github/workflows/chatbot-inference-llama-2-7b_70b-chat-hf-hpu.yml
  #
  # call-inference-mpt-7b-chat-hpu:
  #   uses: ./.github/workflows/chatbot-inference-mpt-7b-chat-hpu.yml
  #
  # call-finetune-mpt-7b-chat-hpu:
  #   uses: ./.github/workflows/chatbot-finetune-mpt-7b-chat-hpu.yml