mirror of
https://github.com/hiyouga/LlamaFactory.git
synced 2026-03-16 22:33:09 +00:00
Compare commits
3 Commits
a3d44e3152
...
246192abd2
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
246192abd2 | ||
|
|
0258dc14d0 | ||
|
|
3045adf0ba |
@@ -1,6 +1,6 @@
|
|||||||
# https://hub.docker.com/r/ascendai/cann/tags
|
# https://hub.docker.com/r/ascendai/cann/tags
|
||||||
|
|
||||||
ARG BASE_IMAGE=quay.io/ascend/cann:8.3.rc2-910b-ubuntu22.04-py3.11
|
ARG BASE_IMAGE=quay.io/ascend/cann:8.5.1-910b-ubuntu22.04-py3.11
|
||||||
FROM ${BASE_IMAGE}
|
FROM ${BASE_IMAGE}
|
||||||
|
|
||||||
# Installation arguments
|
# Installation arguments
|
||||||
@@ -33,9 +33,11 @@ RUN pip config set global.index-url "${PIP_INDEX}" && \
|
|||||||
COPY . /app
|
COPY . /app
|
||||||
|
|
||||||
# Install torch-npu
|
# Install torch-npu
|
||||||
RUN pip uninstall -y torch torchvision torchaudio && \
|
RUN source /usr/local/Ascend/ascend-toolkit/set_env.sh
|
||||||
pip install --no-cache-dir "torch==2.7.1" "torch-npu==2.7.1" "torchvision==0.22.1" "torchaudio==2.7.1" --index-url "${PYTORCH_INDEX}" && \
|
RUN pip uninstall -y torch torchvision torchaudio
|
||||||
pip install --no-cache-dir -e . --no-build-isolation && \
|
RUN pip install --no-cache-dir -r requirements/npu.txt --index-url "${PYTORCH_INDEX}"
|
||||||
|
RUN pip install --no-cache-dir -r requirements/deepspeed.txt
|
||||||
|
RUN pip install --no-cache-dir -e . --no-build-isolation && \
|
||||||
pip install --no-cache-dir -r requirements/metrics.txt --no-build-isolation
|
pip install --no-cache-dir -r requirements/metrics.txt --no-build-isolation
|
||||||
|
|
||||||
# Set up volumes
|
# Set up volumes
|
||||||
|
|||||||
@@ -33,7 +33,7 @@ services:
|
|||||||
dockerfile: ./docker/docker-npu/Dockerfile
|
dockerfile: ./docker/docker-npu/Dockerfile
|
||||||
context: ../..
|
context: ../..
|
||||||
args:
|
args:
|
||||||
BASE_IMAGE: quay.io/ascend/cann:8.3.rc2-a3-ubuntu22.04-py3.11
|
BASE_IMAGE: quay.io/ascend/cann:8.5.1-a3-ubuntu22.04-py3.11
|
||||||
PIP_INDEX: https://pypi.org/simple
|
PIP_INDEX: https://pypi.org/simple
|
||||||
container_name: llamafactory-a3
|
container_name: llamafactory-a3
|
||||||
image: llamafactory:npu-a3
|
image: llamafactory:npu-a3
|
||||||
|
|||||||
@@ -1,4 +1,4 @@
|
|||||||
torch==2.7.1
|
torch==2.7.1
|
||||||
torch-npu==2.7.1
|
torch-npu==2.7.1.post2
|
||||||
torchvision==0.22.1
|
torchvision==0.22.1
|
||||||
torchaudio==2.7.1
|
torchaudio==2.7.1
|
||||||
|
|||||||
@@ -161,7 +161,9 @@ class MMPluginMixin:
|
|||||||
video_processor: BaseImageProcessor = getattr(
|
video_processor: BaseImageProcessor = getattr(
|
||||||
processor, "video_processor", getattr(processor, "image_processor", None)
|
processor, "video_processor", getattr(processor, "image_processor", None)
|
||||||
)
|
)
|
||||||
feature_extractor: SequenceFeatureExtractor = getattr(processor, "feature_extractor", None)
|
feature_extractor: SequenceFeatureExtractor = getattr(processor, "feature_extractor", None) or getattr(
|
||||||
|
processor, "audio_processor", None
|
||||||
|
)
|
||||||
if len(images) != 0 and self.image_token is None:
|
if len(images) != 0 and self.image_token is None:
|
||||||
raise ValueError(
|
raise ValueError(
|
||||||
"This model does not support image input. Please check whether the correct `template` is used."
|
"This model does not support image input. Please check whether the correct `template` is used."
|
||||||
@@ -390,7 +392,9 @@ class MMPluginMixin:
|
|||||||
mm_inputs.update(video_processor(videos, return_tensors="pt"))
|
mm_inputs.update(video_processor(videos, return_tensors="pt"))
|
||||||
|
|
||||||
if len(audios) != 0:
|
if len(audios) != 0:
|
||||||
feature_extractor: SequenceFeatureExtractor = getattr(processor, "feature_extractor", None)
|
feature_extractor: SequenceFeatureExtractor = getattr(processor, "feature_extractor", None) or getattr(
|
||||||
|
processor, "audio_processor", None
|
||||||
|
)
|
||||||
audios = self._regularize_audios(
|
audios = self._regularize_audios(
|
||||||
audios,
|
audios,
|
||||||
sampling_rate=getattr(processor, "audio_sampling_rate", 16000),
|
sampling_rate=getattr(processor, "audio_sampling_rate", 16000),
|
||||||
@@ -1876,7 +1880,9 @@ class Qwen2OmniPlugin(Qwen2VLPlugin):
|
|||||||
) -> dict[str, "torch.Tensor"]:
|
) -> dict[str, "torch.Tensor"]:
|
||||||
image_processor: BaseImageProcessor = getattr(processor, "image_processor", None)
|
image_processor: BaseImageProcessor = getattr(processor, "image_processor", None)
|
||||||
video_processor: BaseVideoProcessor = getattr(processor, "video_processor", None)
|
video_processor: BaseVideoProcessor = getattr(processor, "video_processor", None)
|
||||||
feature_extractor: SequenceFeatureExtractor = getattr(processor, "feature_extractor", None)
|
feature_extractor: SequenceFeatureExtractor = getattr(processor, "feature_extractor", None) or getattr(
|
||||||
|
processor, "audio_processor", None
|
||||||
|
)
|
||||||
mm_inputs = {}
|
mm_inputs = {}
|
||||||
if len(images) != 0:
|
if len(images) != 0:
|
||||||
images = self._regularize_images(
|
images = self._regularize_images(
|
||||||
|
|||||||
@@ -1113,7 +1113,7 @@ register_template(
|
|||||||
register_template(
|
register_template(
|
||||||
name="gpt_oss",
|
name="gpt_oss",
|
||||||
format_user=StringFormatter(slots=["<|start|>user<|message|>{{content}}<|end|><|start|>assistant"]),
|
format_user=StringFormatter(slots=["<|start|>user<|message|>{{content}}<|end|><|start|>assistant"]),
|
||||||
format_assistant=StringFormatter(slots=["{{content}}<|end|>"]),
|
format_assistant=StringFormatter(slots=["{{content}}"]),
|
||||||
format_system=StringFormatter(slots=["<|start|>system<|message|>{{content}}<|end|>"]),
|
format_system=StringFormatter(slots=["<|start|>system<|message|>{{content}}<|end|>"]),
|
||||||
default_system="You are ChatGPT, a large language model trained by OpenAI.",
|
default_system="You are ChatGPT, a large language model trained by OpenAI.",
|
||||||
thought_words=("<|channel|>analysis<|message|>", "<|end|><|start|>assistant<|channel|>final<|message|>"),
|
thought_words=("<|channel|>analysis<|message|>", "<|end|><|start|>assistant<|channel|>final<|message|>"),
|
||||||
|
|||||||
Reference in New Issue
Block a user