Skip to main content
Public
Browse Files
9988a287da05b7cbc8d3f04aacb27c85a9abca1c
Full Commit Hash
Commit Details
551 Added

Initial commit - Upload project 'llamafactory'

WebDev
Authored
January 23, 2026, 5:43 am
Statistics
551
Files Added
0
Files Modified
0
Files Deleted
0
Files Renamed
Changed Files 551 files
qwen2_vl_full.yaml 656 B
A Added · examples/megatron
rms_norm
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops
qwen3_moe_full.yaml 862 B
A Added · examples/megatron
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops/rms_norm
merge_lora
A Added · examples
npu_rms_norm.py 3.1 KB
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops/rms_norm
qwen3_full_sft.yaml 235 B
A Added · examples/merge_lora
rope
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops
qwen3_gptq.yaml 308 B
A Added · examples/merge_lora
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops/rope
qwen3_lora_sft.yaml 370 B
A Added · examples/merge_lora
npu_rope.py 5.34 KB
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops/rope
qwen3vl_lora_sft.yaml 377 B
A Added · examples/merge_lora
registry.py 3.09 KB
A Added · src/llamafactory/v1/plugins/model_plugins/kernels
README_zh.md 6.72 KB
A Added · examples
peft.py 1.74 KB
A Added · src/llamafactory/v1/plugins/model_plugins
README.md 6.87 KB
A Added · examples
quantization.py 0 B
A Added · src/llamafactory/v1/plugins/model_plugins
train_full
A Added · examples
rendering.py 8.72 KB
A Added · src/llamafactory/v1/plugins/model_plugins
qwen3_full_sft.yaml 995 B
A Added · examples/train_full
sampler_plugins
A Added · src/llamafactory/v1/plugins
qwen3vl_full_sft.yaml 1.02 KB
A Added · examples/train_full
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/sampler_plugins
train_lora
A Added · examples
vllm.py 0 B
A Added · src/llamafactory/v1/plugins/sampler_plugins
qwen3_lora_dpo.yaml 967 B
A Added · examples/train_lora
trainer_plugins
A Added · src/llamafactory/v1/plugins
qwen3_lora_kto.yaml 827 B
A Added · examples/train_lora
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/trainer_plugins
qwen3_lora_pretrain.yaml 864 B
A Added · examples/train_lora
batching.py 1.32 KB
A Added · src/llamafactory/v1/plugins/trainer_plugins
qwen3_lora_reward.yaml 894 B
A Added · examples/train_lora
distributed
A Added · src/llamafactory/v1/plugins/trainer_plugins
qwen3_lora_sft_ds3.yaml 1 KB
A Added · examples/train_lora
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/trainer_plugins/distributed
qwen3_lora_sft_ray.yaml 1.26 KB
A Added · examples/train_lora
accelerate.py 0 B
A Added · src/llamafactory/v1/plugins/trainer_plugins/distributed
qwen3_lora_sft.sh 873 B
A Added · examples/train_lora
deepspeed.py 0 B
A Added · src/llamafactory/v1/plugins/trainer_plugins/distributed
qwen3_lora_sft.yaml 907 B
A Added · examples/train_lora
lr_scheduler.py 674 B
A Added · src/llamafactory/v1/plugins/trainer_plugins
qwen3_preprocess.yaml 436 B
A Added · examples/train_lora
optimizer.py 672 B
A Added · src/llamafactory/v1/plugins/trainer_plugins
qwen3vl_lora_dpo.yaml 987 B
A Added · examples/train_lora
samplers
A Added · src/llamafactory/v1
qwen3vl_lora_sft.yaml 965 B
A Added · examples/train_lora
cli_sampler.py 4.2 KB
A Added · src/llamafactory/v1/samplers
train_qlora
A Added · examples
trainers
A Added · src/llamafactory/v1
llama3_lora_sft_aqlm.yaml 865 B
A Added · examples/train_qlora
__init__.py 0 B
A Added · src/llamafactory/v1/trainers
llama3_lora_sft_awq.yaml 853 B
A Added · examples/train_qlora
dpo_trainer.py 0 B
A Added · src/llamafactory/v1/trainers
llama3_lora_sft_gptq.yaml 854 B
A Added · examples/train_qlora
rm_trainer.py 0 B
A Added · src/llamafactory/v1/trainers
qwen3_lora_sft_bnb_npu.yaml 919 B
A Added · examples/train_qlora
sft_trainer.py 1.86 KB
A Added · src/llamafactory/v1/trainers
qwen3_lora_sft_otfq.yaml 983 B
A Added · examples/train_qlora
utils
A Added · src/llamafactory/v1
LICENSE 11.06 KB
A Added · .
__init__.py 0 B
A Added · src/llamafactory/v1/utils
Makefile 741 B
A Added · .
constants.py 607 B
A Added · src/llamafactory/v1/utils
MANIFEST.in 16 B
A Added · .
dtype.py 3.27 KB
A Added · src/llamafactory/v1/utils
pyproject.toml 3.31 KB
A Added · .
env.py 1.03 KB
A Added · src/llamafactory/v1/utils
README_zh.md 66.98 KB
A Added · .
helper.py 2.74 KB
A Added · src/llamafactory/v1/utils
README.md 68.13 KB
A Added · .
logging.py 3.97 KB
A Added · src/llamafactory/v1/utils
requirements
A Added · .
objects.py 2.37 KB
A Added · src/llamafactory/v1/utils
adam-mini.txt 10 B
A Added · requirements
packages.py 1.38 KB
A Added · src/llamafactory/v1/utils
apollo.txt 13 B
A Added · requirements
plugin.py 3.06 KB
A Added · src/llamafactory/v1/utils
aqlm.txt 17 B
A Added · requirements
pytest.py 1.15 KB
A Added · src/llamafactory/v1/utils
badam.txt 13 B
A Added · requirements
types.py 5.8 KB
A Added · src/llamafactory/v1/utils
bitsandbytes.txt 21 B
A Added · requirements
webui
A Added · src/llamafactory
deepspeed.txt 27 B
A Added · requirements
__init__.py 0 B
A Added · src/llamafactory/webui
dev.txt 29 B
A Added · requirements
chatter.py 8.91 KB
A Added · src/llamafactory/webui
eetq.txt 5 B
A Added · requirements
common.py 9.31 KB
A Added · src/llamafactory/webui
fp8-te.txt 54 B
A Added · requirements
components
A Added · src/llamafactory/webui
fp8.txt 34 B
A Added · requirements
__init__.py 1004 B
A Added · src/llamafactory/webui/components
galore.txt 13 B
A Added · requirements
chatbot.py 4.58 KB
A Added · src/llamafactory/webui/components
gptq.txt 33 B
A Added · requirements
data.py 4.39 KB
A Added · src/llamafactory/webui/components
hqq.txt 4 B
A Added · requirements
eval.py 3.37 KB
A Added · src/llamafactory/webui/components
liger-kernel.txt 20 B
A Added · requirements
export.py 5.63 KB
A Added · src/llamafactory/webui/components
metrics.txt 25 B
A Added · requirements
footer.py 1.42 KB
A Added · src/llamafactory/webui/components
minicpm-v.txt 109 B
A Added · requirements
infer.py 2.51 KB
A Added · src/llamafactory/webui/components
npu.txt 68 B
A Added · requirements
top.py 3.8 KB
A Added · src/llamafactory/webui/components
openmind.txt 9 B
A Added · requirements
train.py 16.56 KB
A Added · src/llamafactory/webui/components
sglang.txt 40 B
A Added · requirements
control.py 7.98 KB
A Added · src/llamafactory/webui
swanlab.txt 8 B
A Added · requirements
css.py 1.62 KB
A Added · src/llamafactory/webui
vllm.txt 21 B
A Added · requirements
engine.py 3.52 KB
A Added · src/llamafactory/webui
scripts
A Added · .
interface.py 4.01 KB
A Added · src/llamafactory/webui
api_example
A Added · scripts
locales.py 105.76 KB
A Added · src/llamafactory/webui
test_image.py 2.26 KB
A Added · scripts/api_example
manager.py 2.54 KB
A Added · src/llamafactory/webui
test_toolcall.py 3.01 KB
A Added · scripts/api_example
runner.py 22.06 KB
A Added · src/llamafactory/webui
bench_qwen.py 6.93 KB
A Added · scripts
train.py 762 B
A Added · src
convert_ckpt
A Added · scripts
webui.py 1.13 KB
A Added · src
llamafy_baichuan2.py 4.58 KB
A Added · scripts/convert_ckpt
tests
A Added · .
llamafy_qwen.py 7.33 KB
A Added · scripts/convert_ckpt
tests_v1
A Added · .
tiny_llama4.py 1.38 KB
A Added · scripts/convert_ckpt
accelerator
A Added · tests_v1
tiny_qwen3.py 1.19 KB
A Added · scripts/convert_ckpt
test_interface.py 2.41 KB
A Added · tests_v1/accelerator
eval_bleu_rouge.py 2.51 KB
A Added · scripts
config
A Added · tests_v1
llama_pro.py 5.27 KB
A Added · scripts
test_args_parser.py 2.7 KB
A Added · tests_v1/config
loftq_init.py 3.24 KB
A Added · scripts
conftest.py 5.92 KB
A Added · tests_v1
megatron_merge.py 4.07 KB
A Added · scripts
core
A Added · tests_v1
pissa_init.py 3.13 KB
A Added · scripts
test_data_engine.py 1.36 KB
A Added · tests_v1/core
qwen_omni_merge.py 6.25 KB
A Added · scripts
test_model_loader.py 1.96 KB
A Added · tests_v1/core
stat_utils
A Added · scripts
utils
A Added · tests_v1/core
cal_flops.py 1.84 KB
A Added · scripts/stat_utils
test_batching.py 1.97 KB
A Added · tests_v1/core/utils
cal_lr.py 3.83 KB
A Added · scripts/stat_utils
test_rendering.py 10.32 KB
A Added · tests_v1/core/utils
cal_mfu.py 5.65 KB
A Added · scripts/stat_utils
plugins
A Added · tests_v1
cal_ppl.py 5.36 KB
A Added · scripts/stat_utils
data_plugins
A Added · tests_v1/plugins
length_cdf.py 2.44 KB
A Added · scripts/stat_utils
test_converter.py 5.09 KB
A Added · tests_v1/plugins/data_plugins
vllm_infer.py 11.44 KB
A Added · scripts
model_plugins
A Added · tests_v1/plugins
src
A Added · .
test_init_plugin.py 1.95 KB
A Added · tests_v1/plugins/model_plugins
api.py 1.01 KB
A Added · src
test_kernel_plugin.py 2.98 KB
A Added · tests_v1/plugins/model_plugins
.dockerignore 132 B
A Added · .
llamafactory
A Added · src
sampler
A Added · tests_v1
.env.local 705 B
A Added · .
__init__.py 1022 B
A Added · src/llamafactory
test_cli_sampler.py 1.58 KB
A Added · tests_v1/sampler
.gitattributes 66 B
A Added · .
api
A Added · src/llamafactory
check_license.py 1.19 KB
A Added · tests
.github
A Added · .
__init__.py 0 B
A Added · src/llamafactory/api
conftest.py 5.95 KB
A Added · tests
CODE_OF_CONDUCT.md 5.11 KB
A Added · .github
app.py 4.35 KB
A Added · src/llamafactory/api
data
A Added · tests
CONTRIBUTING.md 2.35 KB
A Added · .github
chat.py 11.48 KB
A Added · src/llamafactory/api
processor
A Added · tests/data
copilot-instructions.md 5.92 KB
A Added · .github
common.py 3.46 KB
A Added · src/llamafactory/api
test_feedback.py 2.18 KB
A Added · tests/data/processor
instructions-v0.md 0 B
A Added · .github
protocol.py 3.8 KB
A Added · src/llamafactory/api
test_pairwise.py 3.3 KB
A Added · tests/data/processor
instructions-v1.md 0 B
A Added · .github
chat
A Added · src/llamafactory
test_processor_utils.py 1.17 KB
A Added · tests/data/processor
ISSUE_TEMPLATE
A Added · .github
__init__.py 697 B
A Added · src/llamafactory/chat
test_supervised.py 4.49 KB
A Added · tests/data/processor
1-bug-report.yml 2.33 KB
A Added · .github/ISSUE_TEMPLATE
base_engine.py 3 KB
A Added · src/llamafactory/chat
test_unsupervised.py 2.2 KB
A Added · tests/data/processor
2-feature-request.yml 1.25 KB
A Added · .github/ISSUE_TEMPLATE
chat_model.py 7.84 KB
A Added · src/llamafactory/chat
test_collator.py 5.62 KB
A Added · tests/data
config.yml 384 B
A Added · .github/ISSUE_TEMPLATE
hf_engine.py 16.08 KB
A Added · src/llamafactory/chat
test_converter.py 2.39 KB
A Added · tests/data
PULL_REQUEST_TEMPLATE.md 233 B
A Added · .github
kt_engine.py 10.7 KB
A Added · src/llamafactory/chat
test_formatter.py 14.98 KB
A Added · tests/data
SECURITY.md 548 B
A Added · .github
sglang_engine.py 12.44 KB
A Added · src/llamafactory/chat
test_loader.py 1.91 KB
A Added · tests/data
workflows
A Added · .github
vllm_engine.py 11.62 KB
A Added · src/llamafactory/chat
test_mm_plugin.py 17.75 KB
A Added · tests/data
docker.yml 3.4 KB
A Added · .github/workflows
cli.py 884 B
A Added · src/llamafactory
test_template.py 16.53 KB
A Added · tests/data
label_issue.yml 830 B
A Added · .github/workflows
data
A Added · src/llamafactory
e2e
A Added · tests
publish.yml 651 B
A Added · .github/workflows
__init__.py 1.18 KB
A Added · src/llamafactory/data
test_chat.py 1.38 KB
A Added · tests/e2e
tests_cuda.yml 1.64 KB
A Added · .github/workflows
collator.py 14.18 KB
A Added · src/llamafactory/data
test_sglang.py 1.99 KB
A Added · tests/e2e
tests_npu.yml 1.87 KB
A Added · .github/workflows
converter.py 17.57 KB
A Added · src/llamafactory/data
test_train.py 2.19 KB
A Added · tests/e2e
tests.yml 2.6 KB
A Added · .github/workflows
data_utils.py 7.22 KB
A Added · src/llamafactory/data
eval
A Added · tests
.gitignore 3.23 KB
A Added · .
formatter.py 5.66 KB
A Added · src/llamafactory/data
test_eval_template.py 3.03 KB
A Added · tests/eval
.pre-commit-config.yaml 713 B
A Added · .
loader.py 13.66 KB
A Added · src/llamafactory/data
model
A Added · tests
assets
A Added · .
mm_plugin.py 90.78 KB
A Added · src/llamafactory/data
model_utils
A Added · tests/model
logo.png 55.52 KB
A Added · assets
parser.py 5.6 KB
A Added · src/llamafactory/data
test_add_tokens.py 1.52 KB
A Added · tests/model/model_utils
sponsors
A Added · assets
processor
A Added · src/llamafactory/data
test_attention.py 1.91 KB
A Added · tests/model/model_utils
serpapi.svg 5.98 KB
A Added · assets/sponsors
__init__.py 1.13 KB
A Added · src/llamafactory/data/processor
test_checkpointing.py 2.41 KB
A Added · tests/model/model_utils
warp.jpg 126.47 KB
A Added · assets/sponsors
feedback.py 5.91 KB
A Added · src/llamafactory/data/processor
test_misc.py 1.5 KB
A Added · tests/model/model_utils
thirdparty
A Added · assets
pairwise.py 5.51 KB
A Added · src/llamafactory/data/processor
test_packing.py 2.09 KB
A Added · tests/model/model_utils
colab.svg 2.31 KB
A Added · assets/thirdparty
pretrain.py 2.72 KB
A Added · src/llamafactory/data/processor
test_visual.py 4.94 KB
A Added · tests/model/model_utils
discord.svg 2.81 KB
A Added · assets/thirdparty
processor_utils.py 3.05 KB
A Added · src/llamafactory/data/processor
test_base.py 1.37 KB
A Added · tests/model
dsw.svg 18.45 KB
A Added · assets/thirdparty
supervised.py 9.51 KB
A Added · src/llamafactory/data/processor
test_freeze.py 2.34 KB
A Added · tests/model
lab4ai.svg 39.57 KB
A Added · assets/thirdparty
unsupervised.py 3.79 KB
A Added · src/llamafactory/data/processor
test_full.py 1.61 KB
A Added · tests/model
online.svg 58.29 KB
A Added · assets/thirdparty
template.py 89.13 KB
A Added · src/llamafactory/data
test_lora.py 3.62 KB
A Added · tests/model
CITATION.cff 1.35 KB
A Added · .
tool_utils.py 24.99 KB
A Added · src/llamafactory/data
test_pissa.py 2.09 KB
A Added · tests/model
data
A Added · .
eval
A Added · src/llamafactory
train
A Added · tests
alpaca_en_demo.json 839.74 KB
A Added · data
__init__.py 0 B
A Added · src/llamafactory/eval
test_sft_trainer.py 3.26 KB
A Added · tests/train
alpaca_zh_demo.json 621.13 KB
A Added · data
evaluator.py 7.19 KB
A Added · src/llamafactory/eval
version.txt 54 B
A Added · tests
c4_demo.jsonl 729.68 KB
A Added · data
template.py 2.8 KB
A Added · src/llamafactory/eval
dataset_info.json 17.16 KB
A Added · data
extras
A Added · src/llamafactory
dpo_en_demo.json 1.5 MB
A Added · data
__init__.py 0 B
A Added · src/llamafactory/extras
dpo_zh_demo.json 833.31 KB
A Added · data
constants.py 119.78 KB
A Added · src/llamafactory/extras
glaive_toolcall_en_demo.json 721.61 KB
A Added · data
env.py 2.98 KB
A Added · src/llamafactory/extras
glaive_toolcall_zh_demo.json 664.73 KB
A Added · data
logging.py 5.13 KB
A Added · src/llamafactory/extras
identity.json 19.83 KB
A Added · data
misc.py 11.34 KB
A Added · src/llamafactory/extras
kto_en_demo.json 892.11 KB
A Added · data
packages.py 2.89 KB
A Added · src/llamafactory/extras
mllm_audio_demo.json 877 B
A Added · data
ploting.py 3.09 KB
A Added · src/llamafactory/extras
mllm_demo_data
A Added · data
hparams
A Added · src/llamafactory
1.jpg 12.04 KB
A Added · data/mllm_demo_data
__init__.py 1.22 KB
A Added · src/llamafactory/hparams
1.mp3 126 KB
A Added · data/mllm_demo_data
data_args.py 7.51 KB
A Added · src/llamafactory/hparams
1.mp4 469.91 KB
A Added · data/mllm_demo_data
evaluation_args.py 1.98 KB
A Added · src/llamafactory/hparams
2.avi 376.71 KB
A Added · data/mllm_demo_data
finetuning_args.py 21.15 KB
A Added · src/llamafactory/hparams
2.jpg 22.15 KB
A Added · data/mllm_demo_data
generating_args.py 2.91 KB
A Added · src/llamafactory/hparams
2.wav 90.71 KB
A Added · data/mllm_demo_data
model_args.py 21.14 KB
A Added · src/llamafactory/hparams
3.flac 117.23 KB
A Added · data/mllm_demo_data
parser.py 23.2 KB
A Added · src/llamafactory/hparams
3.jpg 15.73 KB
A Added · data/mllm_demo_data
training_args.py 4.65 KB
A Added · src/llamafactory/hparams
3.mp4 264.5 KB
A Added · data/mllm_demo_data
launcher.py 6.41 KB
A Added · src/llamafactory
4.mp3 79.02 KB
A Added · data/mllm_demo_data
model
A Added · src/llamafactory
4.mp4 66.46 KB
A Added · data/mllm_demo_data
__init__.py 976 B
A Added · src/llamafactory/model
mllm_demo.json 3.22 KB
A Added · data
adapter.py 15.47 KB
A Added · src/llamafactory/model
mllm_video_audio_demo.json 1.05 KB
A Added · data
loader.py 9.79 KB
A Added · src/llamafactory/model
mllm_video_demo.json 828 B
A Added · data
model_utils
A Added · src/llamafactory/model
README_zh.md 12.67 KB
A Added · data
__init__.py 0 B
A Added · src/llamafactory/model/model_utils
README.md 13.42 KB
A Added · data
attention.py 4.44 KB
A Added · src/llamafactory/model/model_utils
reason_tool_use_demo_50.jsonl 252.75 KB
A Added · data
checkpointing.py 7.7 KB
A Added · src/llamafactory/model/model_utils
v1_dpo_demo.jsonl 28.43 KB
A Added · data
embedding.py 8.89 KB
A Added · src/llamafactory/model/model_utils
v1_dpo_demo.yaml 89 B
A Added · data
ktransformers.py 6.61 KB
A Added · src/llamafactory/model/model_utils
v1_sft_demo.jsonl 433.68 KB
A Added · data
kv_cache.py 1.49 KB
A Added · src/llamafactory/model/model_utils
v1_sft_demo.yaml 170 B
A Added · data
liger_kernel.py 4.43 KB
A Added · src/llamafactory/model/model_utils
wiki_demo.txt 1004.22 KB
A Added · data
longlora.py 15.74 KB
A Added · src/llamafactory/model/model_utils
docker
A Added · .
misc.py 3.44 KB
A Added · src/llamafactory/model/model_utils
docker-cuda
A Added · docker
mod.py 1.39 KB
A Added · src/llamafactory/model/model_utils
docker-compose.yml 541 B
A Added · docker/docker-cuda
moe.py 9.49 KB
A Added · src/llamafactory/model/model_utils
Dockerfile 1.7 KB
A Added · docker/docker-cuda
packing.py 4.08 KB
A Added · src/llamafactory/model/model_utils
Dockerfile.base 2.22 KB
A Added · docker/docker-cuda
quantization.py 9.85 KB
A Added · src/llamafactory/model/model_utils
Dockerfile.megatron 2.87 KB
A Added · docker/docker-cuda
rope.py 3.3 KB
A Added · src/llamafactory/model/model_utils
README.md 3.04 KB
A Added · docker/docker-cuda
unsloth.py 3.69 KB
A Added · src/llamafactory/model/model_utils
docker-npu
A Added · docker
valuehead.py 2.71 KB
A Added · src/llamafactory/model/model_utils
docker-compose.yml 1.55 KB
A Added · docker/docker-npu
visual.py 12.24 KB
A Added · src/llamafactory/model/model_utils
Dockerfile 1.65 KB
A Added · docker/docker-npu
patcher.py 12.13 KB
A Added · src/llamafactory/model
docker-rocm
A Added · docker
third_party
A Added · src/llamafactory
docker-compose.yml 450 B
A Added · docker/docker-rocm
__init__.py 0 B
A Added · src/llamafactory/third_party
Dockerfile 2.04 KB
A Added · docker/docker-rocm
muon
A Added · src/llamafactory/third_party
examples
A Added · .
__init__.py 631 B
A Added · src/llamafactory/third_party/muon
accelerate
A Added · examples
muon.py 8.94 KB
A Added · src/llamafactory/third_party/muon
fsdp_config_multiple_nodes.yaml 1.29 KB
A Added · examples/accelerate
train
A Added · src/llamafactory
fsdp_config_offload.yaml 743 B
A Added · examples/accelerate
__init__.py 0 B
A Added · src/llamafactory/train
fsdp_config.yaml 707 B
A Added · examples/accelerate
callbacks.py 15.87 KB
A Added · src/llamafactory/train
fsdp2_config.yaml 592 B
A Added · examples/accelerate
dpo
A Added · src/llamafactory/train
ascend
A Added · examples
__init__.py 641 B
A Added · src/llamafactory/train/dpo
qwen3_full_sft_fsdp2.yaml 990 B
A Added · examples/ascend
ktrainer.py 2.66 KB
A Added · src/llamafactory/train/dpo
qwen3moe_full_sft_fsdp.yaml 1.03 KB
A Added · examples/ascend
trainer.py 15.13 KB
A Added · src/llamafactory/train/dpo
qwen3vlmoe_full_sft_fsdp2.yaml 1.1 KB
A Added · examples/ascend
workflow.py 4.52 KB
A Added · src/llamafactory/train/dpo
qwen3vlmoe_lora_sft_fsdp.yaml 972 B
A Added · examples/ascend
fp8_utils.py 8.81 KB
A Added · src/llamafactory/train
deepspeed
A Added · examples
kto
A Added · src/llamafactory/train
ds_z0_config.json 665 B
A Added · examples/deepspeed
__init__.py 641 B
A Added · src/llamafactory/train/kto
ds_z2_autotp_config.json 835 B
A Added · examples/deepspeed
trainer.py 13.21 KB
A Added · src/llamafactory/train/kto
ds_z2_config.json 665 B
A Added · examples/deepspeed
workflow.py 3.9 KB
A Added · src/llamafactory/train/kto
ds_z2_offload_config.json 747 B
A Added · examples/deepspeed
mca
A Added · src/llamafactory/train
ds_z3_config.json 789 B
A Added · examples/deepspeed
__init__.py 679 B
A Added · src/llamafactory/train/mca
ds_z3_fp8_config.json 1.08 KB
A Added · examples/deepspeed
trainer.py 624 B
A Added · src/llamafactory/train/mca
ds_z3_offload_config.json 949 B
A Added · examples/deepspeed
workflow.py 11.04 KB
A Added · src/llamafactory/train/mca
extras
A Added · examples
ppo
A Added · src/llamafactory/train
adam_mini
A Added · examples/extras
__init__.py 641 B
A Added · src/llamafactory/train/ppo
qwen2_full_sft.yaml 849 B
A Added · examples/extras/adam_mini
ppo_utils.py 3.27 KB
A Added · src/llamafactory/train/ppo
apollo
A Added · examples/extras
trainer.py 23.23 KB
A Added · src/llamafactory/train/ppo
llama3_full_sft.yaml 1.03 KB
A Added · examples/extras/apollo
workflow.py 3.31 KB
A Added · src/llamafactory/train/ppo
badam
A Added · examples/extras
pt
A Added · src/llamafactory/train
llama3_full_sft.yaml 963 B
A Added · examples/extras/badam
__init__.py 639 B
A Added · src/llamafactory/train/pt
dft
A Added · examples/extras
trainer.py 3.57 KB
A Added · src/llamafactory/train/pt
qwen2_full_sft.yaml 848 B
A Added · examples/extras/dft
workflow.py 3.78 KB
A Added · src/llamafactory/train/pt
eaft
A Added · examples/extras
rm
A Added · src/llamafactory/train
qwen25_05b_eaft_full.yaml 753 B
A Added · examples/extras/eaft
__init__.py 639 B
A Added · src/llamafactory/train/rm
fp8
A Added · examples/extras
metric.py 1.7 KB
A Added · src/llamafactory/train/rm
llama3_fp8_deepspeed_sft.yaml 1.15 KB
A Added · examples/extras/fp8
trainer.py 5.5 KB
A Added · src/llamafactory/train/rm
llama3_fp8_fsdp_sft.yaml 1.24 KB
A Added · examples/extras/fp8
workflow.py 3.93 KB
A Added · src/llamafactory/train/rm
fsdp_qlora
A Added · examples/extras
sft
A Added · src/llamafactory/train
llama3_lora_sft.yaml 891 B
A Added · examples/extras/fsdp_qlora
__init__.py 641 B
A Added · src/llamafactory/train/sft
train.sh 222 B
A Added · examples/extras/fsdp_qlora
metric.py 4.86 KB
A Added · src/llamafactory/train/sft
galore
A Added · examples/extras
trainer.py 7.54 KB
A Added · src/llamafactory/train/sft
llama3_full_sft.yaml 1 KB
A Added · examples/extras/galore
workflow.py 7.44 KB
A Added · src/llamafactory/train/sft
llama_pro
A Added · examples/extras
test_utils.py 4.68 KB
A Added · src/llamafactory/train
expand.sh 165 B
A Added · examples/extras/llama_pro
trainer_utils.py 33.7 KB
A Added · src/llamafactory/train
llama3_freeze_sft.yaml 911 B
A Added · examples/extras/llama_pro
tuner.py 9.03 KB
A Added · src/llamafactory/train
loraplus
A Added · examples/extras
v1
A Added · src/llamafactory
llama3_lora_sft.yaml 895 B
A Added · examples/extras/loraplus
__init__.py 0 B
A Added · src/llamafactory/v1
mod
A Added · examples/extras
accelerator
A Added · src/llamafactory/v1
llama3_full_sft.yaml 901 B
A Added · examples/extras/mod
__init__.py 0 B
A Added · src/llamafactory/v1/accelerator
multi_tokens
A Added · examples/extras
helper.py 6.65 KB
A Added · src/llamafactory/v1/accelerator
tokens_cfg.yaml 1.06 KB
A Added · examples/extras/multi_tokens
interface.py 9.16 KB
A Added · src/llamafactory/v1/accelerator
muon
A Added · examples/extras
profiler.py 0 B
A Added · src/llamafactory/v1/accelerator
qwen2_full_sft.yaml 844 B
A Added · examples/extras/muon
config
A Added · src/llamafactory/v1
nlg_eval
A Added · examples/extras
__init__.py 1.05 KB
A Added · src/llamafactory/v1/config
llama3_lora_predict.yaml 745 B
A Added · examples/extras/nlg_eval
arg_parser.py 2.58 KB
A Added · src/llamafactory/v1/config
oft
A Added · examples/extras
arg_utils.py 2.74 KB
A Added · src/llamafactory/v1/config
llama3_oft_sft.yaml 934 B
A Added · examples/extras/oft
data_args.py 918 B
A Added · src/llamafactory/v1/config
qwen2_5vl_oft_sft.yaml 985 B
A Added · examples/extras/oft
model_args.py 2.11 KB
A Added · src/llamafactory/v1/config
pissa
A Added · examples/extras
sample_args.py 983 B
A Added · src/llamafactory/v1/config
init.sh 147 B
A Added · examples/extras/pissa
training_args.py 2.88 KB
A Added · src/llamafactory/v1/config
llama3_lora_sft.yaml 923 B
A Added · examples/extras/pissa
core
A Added · src/llamafactory/v1
qoft
A Added · examples/extras
__init__.py 0 B
A Added · src/llamafactory/v1/core
llama3_oft_sft_awq.yaml 878 B
A Added · examples/extras/qoft
base_sampler.py 2.04 KB
A Added · src/llamafactory/v1/core
llama3_oft_sft_bnb_npu.yaml 946 B
A Added · examples/extras/qoft
base_trainer.py 6.71 KB
A Added · src/llamafactory/v1/core
llama3_oft_sft_gptq.yaml 879 B
A Added · examples/extras/qoft
data_engine.py 7.25 KB
A Added · src/llamafactory/v1/core
inference
A Added · examples
model_engine.py 5.36 KB
A Added · src/llamafactory/v1/core
qwen3_full_sft.yaml 174 B
A Added · examples/inference
utils
A Added · src/llamafactory/v1/core
qwen3_lora_sft.yaml 224 B
A Added · examples/inference
__init__.py 0 B
A Added · src/llamafactory/v1/core/utils
qwen3.yaml 178 B
A Added · examples/inference
batching.py 8.64 KB
A Added · src/llamafactory/v1/core/utils
qwen3vl.yaml 179 B
A Added · examples/inference
callback.py 0 B
A Added · src/llamafactory/v1/core/utils
ktransformers
A Added · examples
inference_engine.py 3.69 KB
A Added · src/llamafactory/v1/core/utils
infer_lora
A Added · examples/ktransformers
rendering.py 6.48 KB
A Added · src/llamafactory/v1/core/utils
deepseek2_lora_sft_kt.yaml 414 B
A Added · examples/ktransformers/infer_lora
launcher.py 1.8 KB
A Added · src/llamafactory/v1
deepseek3_kt.yaml 380 B
A Added · examples/ktransformers/infer_lora
plugins
A Added · src/llamafactory/v1
deepseek3_lora_sft_kt.yaml 426 B
A Added · examples/ktransformers/infer_lora
__init__.py 0 B
A Added · src/llamafactory/v1/plugins
qwen3moe_lora_sft_kt.yaml 419 B
A Added · examples/ktransformers/infer_lora
data_plugins
A Added · src/llamafactory/v1/plugins
kt_optimize_rules
A Added · examples/ktransformers
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/data_plugins
DeepSeek-V2-Chat-sft-amx.yaml 2.23 KB
A Added · examples/ktransformers/kt_optimize_rules
converter.py 6.88 KB
A Added · src/llamafactory/v1/plugins/data_plugins
DeepSeek-V2-Chat.yaml 2.17 KB
A Added · examples/ktransformers/kt_optimize_rules
loader.py 3.6 KB
A Added · src/llamafactory/v1/plugins/data_plugins
DeepSeek-V2-Lite-Chat-sft-amx-multi-gpu.yaml 4.45 KB
A Added · examples/ktransformers/kt_optimize_rules
model_plugins
A Added · src/llamafactory/v1/plugins
DeepSeek-V2-Lite-Chat-sft-amx.yaml 2.23 KB
A Added · examples/ktransformers/kt_optimize_rules
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/model_plugins
DeepSeek-V2-Lite-Chat-sft.yaml 2.17 KB
A Added · examples/ktransformers/kt_optimize_rules
add_token.py 0 B
A Added · src/llamafactory/v1/plugins/model_plugins
DeepSeek-V2-Lite-Chat.yaml 2.17 KB
A Added · examples/ktransformers/kt_optimize_rules
initialization.py 1.31 KB
A Added · src/llamafactory/v1/plugins/model_plugins
DeepSeek-V3-Chat-amx.yaml 2.65 KB
A Added · examples/ktransformers/kt_optimize_rules
kernels
A Added · src/llamafactory/v1/plugins/model_plugins
DeepSeek-V3-Chat-sft-amx-multi-gpu-4.yaml 10.93 KB
A Added · examples/ktransformers/kt_optimize_rules
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/model_plugins/kernels
DeepSeek-V3-Chat-sft-amx-multi-gpu.yaml 5.09 KB
A Added · examples/ktransformers/kt_optimize_rules
base.py 2.99 KB
A Added · src/llamafactory/v1/plugins/model_plugins/kernels
DeepSeek-V3-Chat-sft-amx.yaml 2.65 KB
A Added · examples/ktransformers/kt_optimize_rules
interface.py 4.19 KB
A Added · src/llamafactory/v1/plugins/model_plugins/kernels
Qwen3Moe-sft-amx.yaml 2.67 KB
A Added · examples/ktransformers/kt_optimize_rules
ops
A Added · src/llamafactory/v1/plugins/model_plugins/kernels
train_lora
A Added · examples/ktransformers
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops
deepseek2_lora_sft_kt.yaml 1.1 KB
A Added · examples/ktransformers/train_lora
mlp
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops
deepseek3_lora_sft_kt.yaml 1.11 KB
A Added · examples/ktransformers/train_lora
__init__.py 0 B
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops/mlp
qwen3moe_lora_sft_kt.yaml 1.1 KB
A Added · examples/ktransformers/train_lora
npu_fused_moe.py 12.12 KB
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops/mlp
megatron
A Added · examples
npu_swiglu.py 4.99 KB
A Added · src/llamafactory/v1/plugins/model_plugins/kernels/ops/mlp
Quick Actions
Commit Information
Hash:
9988a287da05
Commit ID:
81
Created:
2026-01-23 05:43:11
Age:
Jan 23, 2026
Repository:
llamafactory
Total Files:
551
Download Options