Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
694 commits
Select commit Hold shift + click to select a range
515cf5a
Update rl_replacements.py
danielhanchen Feb 20, 2025
2cf4349
Update rl.py
danielhanchen Feb 20, 2025
ae8bf68
Update rl.py
danielhanchen Feb 20, 2025
e07f4bc
Update rl.py
danielhanchen Feb 20, 2025
f11e5ab
Merge branch 'main' into nightly
danielhanchen Feb 20, 2025
3fccf5d
Update rl.py
danielhanchen Feb 20, 2025
798ad95
fix an import error (#1767)
NinoRisteski Feb 20, 2025
2957d89
SamplingParams
danielhanchen Feb 20, 2025
19d57bc
Convert mask to float (#1762)
Erland366 Feb 20, 2025
07aea40
[Windows Support] Add latest `xformers` wheels to pyproject.toml (#1753)
versipellis Feb 20, 2025
77109a4
Merge branch 'nightly' of https://github.com/unslothai/unsloth into n…
danielhanchen Feb 20, 2025
f3d9efb
vLLMSamplingParams
danielhanchen Feb 20, 2025
6d5caca
Update __init__.py
danielhanchen Feb 20, 2025
3a5610e
default num_chunks == -1
danielhanchen Feb 20, 2025
0362bd2
Versioning
danielhanchen Feb 20, 2025
2969db8
Merge branch 'main' into nightly
danielhanchen Feb 20, 2025
b5eda24
Update llama.py
danielhanchen Feb 20, 2025
7de0022
Update llama.py
danielhanchen Feb 20, 2025
d4d7694
Update llama.py
danielhanchen Feb 20, 2025
0bbfbe8
Update llama.py
danielhanchen Feb 20, 2025
ae6e2bd
Update llama.py
danielhanchen Feb 20, 2025
1792deb
Update _utils.py
danielhanchen Feb 20, 2025
5dcd079
Update rl_replacements.py
danielhanchen Feb 20, 2025
ec6e0b7
Update rl_replacements.py
danielhanchen Feb 20, 2025
bc1d2ce
Update pyproject.toml
danielhanchen Feb 20, 2025
adbe38e
Update pyproject.toml
danielhanchen Feb 20, 2025
a9b542f
Export Model to ollama.com (#1648)
gjyotin305 Feb 22, 2025
f853ac0
Merge branch 'main' into nightly
danielhanchen Mar 3, 2025
9cab347
Update cross_entropy_loss.py
danielhanchen Mar 3, 2025
0ae9082
torch_cuda_device
danielhanchen Mar 3, 2025
f21314c
Update utils.py
danielhanchen Mar 3, 2025
9215212
Update utils.py
danielhanchen Mar 3, 2025
9d95aee
Update utils.py
danielhanchen Mar 3, 2025
35e9144
device
danielhanchen Mar 3, 2025
30b6f94
device
danielhanchen Mar 3, 2025
64e2b00
Update loader.py
danielhanchen Mar 3, 2025
ffa3278
Update llama.py
danielhanchen Mar 3, 2025
748c5b5
Update README.md
danielhanchen Mar 3, 2025
469ed48
Update llama.py
danielhanchen Mar 3, 2025
bc87afd
Update llama.py
danielhanchen Mar 3, 2025
ee9d6e5
Update _utils.py
danielhanchen Mar 4, 2025
91458bb
Update utils.py
danielhanchen Mar 4, 2025
a7a5d75
Update utils.py
danielhanchen Mar 4, 2025
d93cca2
Update utils.py
danielhanchen Mar 4, 2025
6e2a3a8
Update utils.py
danielhanchen Mar 4, 2025
8f9ba99
Update utils.py
danielhanchen Mar 4, 2025
ed697da
Update llama.py
danielhanchen Mar 4, 2025
d73c34b
Update llama.py
danielhanchen Mar 4, 2025
4485da7
Update llama.py
danielhanchen Mar 4, 2025
45ea48c
Update llama.py
danielhanchen Mar 4, 2025
8c4b79c
Update llama.py
danielhanchen Mar 4, 2025
c2ae510
Update utils.py
danielhanchen Mar 4, 2025
432ea24
Update utils.py
danielhanchen Mar 4, 2025
dcff03c
Update utils.py
danielhanchen Mar 4, 2025
6ef0866
Update utils.py
danielhanchen Mar 4, 2025
8c8ce96
__version__
danielhanchen Mar 4, 2025
208971b
Update rl.py
danielhanchen Mar 4, 2025
adc6977
Bug fixes
danielhanchen Mar 4, 2025
949c298
Bug fixes
danielhanchen Mar 4, 2025
ad6d962
Merge branch 'main' into nightly
danielhanchen Mar 4, 2025
59b24ad
Update llama.py
danielhanchen Mar 5, 2025
5df3936
Update _utils.py
danielhanchen Mar 5, 2025
b8b0f9c
_wrap_fast_inference
danielhanchen Mar 5, 2025
6f0857b
Update llama.py
danielhanchen Mar 5, 2025
109364b
Update llama.py
danielhanchen Mar 5, 2025
dd4bd07
Update llama.py
danielhanchen Mar 5, 2025
b356fce
Update llama.py
danielhanchen Mar 5, 2025
e022016
Update llama.py
danielhanchen Mar 5, 2025
12094a7
Update llama.py
danielhanchen Mar 5, 2025
2836128
Update llama.py
danielhanchen Mar 5, 2025
c956616
Update llama.py
danielhanchen Mar 5, 2025
e887f43
Update llama.py
danielhanchen Mar 5, 2025
95f872d
Update llama.py
danielhanchen Mar 5, 2025
647dbb4
Update llama.py
danielhanchen Mar 5, 2025
f640c8d
Update _utils.py
danielhanchen Mar 5, 2025
91a4fce
SFT dataset prepare
danielhanchen Mar 5, 2025
4495148
Update pyproject.toml
danielhanchen Mar 5, 2025
f41dff5
Update rl_replacements.py
danielhanchen Mar 5, 2025
0a3dbfa
Update rl_replacements.py
danielhanchen Mar 5, 2025
7d8f100
Update rl_replacements.py
danielhanchen Mar 5, 2025
413ea80
Update rl.py
danielhanchen Mar 5, 2025
3f5ce93
Update llama.py
danielhanchen Mar 5, 2025
185bced
Update llama.py
danielhanchen Mar 5, 2025
fd11ad7
Update utils.py
danielhanchen Mar 5, 2025
97ed0b4
bug fix
danielhanchen Mar 5, 2025
68eca88
Update llama.py
danielhanchen Mar 5, 2025
5daf9b5
Update llama.py
danielhanchen Mar 5, 2025
858bb76
Update llama.py
danielhanchen Mar 5, 2025
daedc34
Update llama.py
danielhanchen Mar 5, 2025
95e2371
Update llama.py
danielhanchen Mar 5, 2025
fccd68a
Update __init__.py
danielhanchen Mar 5, 2025
c665e0b
Update _utils.py
danielhanchen Mar 6, 2025
d207daf
Merge branch 'main' into nightly
danielhanchen Mar 6, 2025
dbf7eac
Update _utils.py
danielhanchen Mar 6, 2025
b55f6d9
Update _utils.py
danielhanchen Mar 6, 2025
c7abf7d
Update _utils.py
danielhanchen Mar 6, 2025
98d5ab0
Update _utils.py
danielhanchen Mar 6, 2025
f72794e
Update rl.py
danielhanchen Mar 6, 2025
1ec0ee2
Update rl.py
danielhanchen Mar 6, 2025
5350c6a
Update rl.py
danielhanchen Mar 6, 2025
9009ef0
Update _utils.py
danielhanchen Mar 6, 2025
7f7899d
Update __init__.py
danielhanchen Mar 6, 2025
334bd77
Update _utils.py
danielhanchen Mar 6, 2025
ade31e2
Version
danielhanchen Mar 6, 2025
a31e45b
Merge branch 'main' into nightly
danielhanchen Mar 6, 2025
8015ff2
versioning
danielhanchen Mar 6, 2025
d8777be
Update _utils.py
danielhanchen Mar 6, 2025
132b838
Update llama.py
danielhanchen Mar 6, 2025
21faa50
Update llama.py
danielhanchen Mar 6, 2025
af5d875
Merge branch 'main' into nightly
danielhanchen Mar 6, 2025
904e1c5
Bug fixes
danielhanchen Mar 7, 2025
761bb8f
FastModel
danielhanchen Mar 8, 2025
7bf880f
__doc__
danielhanchen Mar 8, 2025
c93b51b
Update vision.py
danielhanchen Mar 8, 2025
f8867be
Update loader.py
danielhanchen Mar 8, 2025
2ab1828
Update loader.py
danielhanchen Mar 8, 2025
e05baed
Update loader.py
danielhanchen Mar 8, 2025
31012a7
version
danielhanchen Mar 8, 2025
a8bf659
Merge branch 'main' into nightly
danielhanchen Mar 9, 2025
d72e3e0
move use_modelscope to _utils (#1938)
KareemMusleh Mar 9, 2025
7e82339
Don't use revision when loading model_config and is_peft=True (#1949)
wiwu2390 Mar 9, 2025
4904c48
More syntax warnings (#1944)
KareemMusleh Mar 9, 2025
7aaa605
Update loader.py
danielhanchen Mar 9, 2025
a585536
Full finetuning and other fixes
danielhanchen Mar 10, 2025
133c0ae
UNSLOTH_ENABLE_FULL_FINETUNING
danielhanchen Mar 10, 2025
9d5aa5c
Update loader.py
danielhanchen Mar 10, 2025
934ad16
Update loader.py
danielhanchen Mar 10, 2025
76f2f2a
Update loader.py
danielhanchen Mar 10, 2025
f763ed6
Update vision.py
danielhanchen Mar 10, 2025
0df9518
Update vision.py
danielhanchen Mar 10, 2025
ced164e
full finetuning
danielhanchen Mar 10, 2025
5b45f0f
Update loader.py
danielhanchen Mar 10, 2025
23d45cf
Update loader.py
danielhanchen Mar 10, 2025
bdebea7
Update loader.py
danielhanchen Mar 10, 2025
04f1abc
Update _utils.py
danielhanchen Mar 10, 2025
4c0a8d6
max_seq_length
danielhanchen Mar 10, 2025
8f16ce0
Update rl.py
danielhanchen Mar 10, 2025
8b16a16
Update rl.py
danielhanchen Mar 10, 2025
a8c96d3
Update rl.py
danielhanchen Mar 10, 2025
739b1dd
Update pyproject.toml
danielhanchen Mar 11, 2025
c555388
AutoModelForImageTextToText
danielhanchen Mar 11, 2025
77fec99
Update mapper.py
danielhanchen Mar 11, 2025
c539fc6
Update pyproject.toml
danielhanchen Mar 11, 2025
3ddcf84
Update _utils.py
danielhanchen Mar 11, 2025
3aa2d95
Update _utils.py
danielhanchen Mar 11, 2025
a3541c0
Update _utils.py
danielhanchen Mar 11, 2025
a4faf0f
Batch samples
danielhanchen Mar 12, 2025
eb0add4
Update loader.py
danielhanchen Mar 12, 2025
b556785
Update loader.py
danielhanchen Mar 12, 2025
ead1b3b
Update loader.py
danielhanchen Mar 12, 2025
b388d8d
Update loader.py
danielhanchen Mar 12, 2025
80eac80
Update _utils.py
danielhanchen Mar 12, 2025
d6d862e
Update loader.py
danielhanchen Mar 12, 2025
ea6aae6
Update vision.py
danielhanchen Mar 12, 2025
0c4ebb3
Update loader.py
danielhanchen Mar 12, 2025
528e8f0
Update vision.py
danielhanchen Mar 12, 2025
152b376
Update vision.py
danielhanchen Mar 12, 2025
2fdeecd
Update vision.py
danielhanchen Mar 12, 2025
ceda772
Update mapper.py
danielhanchen Mar 12, 2025
0df6ad4
Merge branch 'main' into nightly
danielhanchen Mar 12, 2025
f386f0f
Update vision.py
danielhanchen Mar 12, 2025
b6187c6
Temporary patches
danielhanchen Mar 13, 2025
bb59cec
Update loader.py
danielhanchen Mar 13, 2025
3326c4f
model names
danielhanchen Mar 13, 2025
bb193e4
Gemma 3 chat template
danielhanchen Mar 13, 2025
57a5442
Bug fixes
danielhanchen Mar 13, 2025
8457c75
Update vision.py
danielhanchen Mar 13, 2025
bc735a7
Update vision.py
danielhanchen Mar 13, 2025
ed588ee
Update vision.py
danielhanchen Mar 13, 2025
a3637fa
Update vision.py
danielhanchen Mar 13, 2025
6218eae
Update vision.py
danielhanchen Mar 13, 2025
9005a57
Update llama.py
danielhanchen Mar 13, 2025
97f40bd
Update llama.py
danielhanchen Mar 13, 2025
24cd9f7
Update rl.py
danielhanchen Mar 13, 2025
b0d9ee0
Update chat_templates.py
danielhanchen Mar 13, 2025
07f47a4
Update chat_templates.py
danielhanchen Mar 13, 2025
caec8ff
Update vision.py
danielhanchen Mar 13, 2025
c96eab5
Update vision.py
danielhanchen Mar 13, 2025
6e58d97
Update vision.py
danielhanchen Mar 13, 2025
dd17676
Update loader.py
danielhanchen Mar 13, 2025
7d0893b
Update vision.py
danielhanchen Mar 13, 2025
8b51a7d
Update vision.py
danielhanchen Mar 13, 2025
833e295
Revert
danielhanchen Mar 13, 2025
20ae25a
Update _utils.py
danielhanchen Mar 13, 2025
067fb5e
forced precision
danielhanchen Mar 13, 2025
7493af8
Autocast
danielhanchen Mar 13, 2025
6dcd0bf
Update vision.py
danielhanchen Mar 13, 2025
c6eae35
Update vision.py
danielhanchen Mar 13, 2025
d1f09cf
Update rl.py
danielhanchen Mar 13, 2025
e0e31d9
Update vision.py
danielhanchen Mar 13, 2025
57576a5
Update vision.py
danielhanchen Mar 13, 2025
3b6c379
Update vision.py
danielhanchen Mar 13, 2025
b284ed5
Update vision.py
danielhanchen Mar 13, 2025
ed80c07
Update vision.py
danielhanchen Mar 13, 2025
171ad42
Update rl.py
danielhanchen Mar 13, 2025
9f6d280
vLLM fixes
danielhanchen Mar 14, 2025
f525442
constexpr
danielhanchen Mar 14, 2025
6e7d5be
Update vision.py
danielhanchen Mar 14, 2025
e388265
Update vision.py
danielhanchen Mar 14, 2025
2def2a5
Update vision.py
danielhanchen Mar 14, 2025
69f4581
Update rl.py
danielhanchen Mar 14, 2025
13788ab
Update llama.py
danielhanchen Mar 14, 2025
7ccacc3
Update llama.py
danielhanchen Mar 14, 2025
a219029
Update llama.py
danielhanchen Mar 14, 2025
d9d1116
Update llama.py
danielhanchen Mar 14, 2025
050cb85
Update llama.py
danielhanchen Mar 14, 2025
ae54a69
Update llama.py
danielhanchen Mar 14, 2025
5a4f410
Update llama.py
danielhanchen Mar 14, 2025
c21dba4
Update llama.py
danielhanchen Mar 14, 2025
1f7f78e
Update _utils.py
danielhanchen Mar 14, 2025
edd6181
Update _utils.py
danielhanchen Mar 14, 2025
6547468
Update _utils.py
danielhanchen Mar 14, 2025
7afe411
Update _utils.py
danielhanchen Mar 14, 2025
13b4a95
Update save.py
danielhanchen Mar 14, 2025
2b76350
New models
danielhanchen Mar 14, 2025
1b45ab6
Triton windows update (#1976)
Captain-T2004 Mar 14, 2025
6aaf377
Update RMS LayerNorm implementation, and list compr. change in chat t…
NinoRisteski Mar 14, 2025
94f075c
Update Zoo
danielhanchen Mar 14, 2025
1d6c395
Merge branch 'nightly' of https://github.com/unslothai/unsloth into n…
danielhanchen Mar 14, 2025
8ec6e8b
Merge branch 'main' into nightly
danielhanchen Mar 14, 2025
4ef899c
Update llama.py
danielhanchen Mar 14, 2025
9cd4f47
Update llama.py
danielhanchen Mar 14, 2025
5e17f22
Update vision.py
danielhanchen Mar 14, 2025
0003ead
Update vision.py
danielhanchen Mar 14, 2025
8f455fc
Update vision.py
danielhanchen Mar 14, 2025
790833e
Update vision.py
danielhanchen Mar 14, 2025
ba8408d
Update vision.py
danielhanchen Mar 14, 2025
e78fe39
Update vision.py
danielhanchen Mar 14, 2025
6b5eb3c
Update vision.py
danielhanchen Mar 14, 2025
9703843
Update vision.py
danielhanchen Mar 14, 2025
f6efd4d
Update vision.py
danielhanchen Mar 14, 2025
9bc273b
Update vision.py
danielhanchen Mar 14, 2025
26045d8
Update vision.py
danielhanchen Mar 14, 2025
f988ed4
Update vision.py
danielhanchen Mar 14, 2025
5d98f5b
Update rl_replacements.py
danielhanchen Mar 14, 2025
4079dba
Update vision.py
danielhanchen Mar 14, 2025
9554dd5
grpo fix
danielhanchen Mar 14, 2025
3a76607
Update rl_replacements.py
danielhanchen Mar 14, 2025
1d73f9e
Update vision.py
danielhanchen Mar 14, 2025
35383c3
Update rl_replacements.py
danielhanchen Mar 14, 2025
fc74d92
Update vision.py
danielhanchen Mar 14, 2025
3ac4fa5
Update mapper.py
danielhanchen Mar 14, 2025
b75698c
Update vision.py
danielhanchen Mar 14, 2025
87363a6
Update vision.py
danielhanchen Mar 14, 2025
1a17945
Update loader.py
danielhanchen Mar 14, 2025
e72a79a
Merge branch 'main' into nightly
danielhanchen Mar 14, 2025
21867b7
Update vision.py
danielhanchen Mar 14, 2025
a6e86f4
Update save.py
danielhanchen Mar 14, 2025
b9de6dc
Update save.py
danielhanchen Mar 14, 2025
3c3d9b3
Update save.py
danielhanchen Mar 14, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion unsloth/models/vision.py
Original file line number Diff line number Diff line change
Expand Up @@ -485,7 +485,7 @@ def post_patch_model(
full_finetuning = os.environ.get("UNSLOTH_ENABLE_FULL_FINETUNING", "0") == "1"

float32_mixed_precision = True
if _get_dtype(model.config.torch_dtype) == torch.bfloat16:
if _get_dtype(model.config.torch_dtype) == torch.bfloat16 and full_finetuning:
# Use bfloat16 precision for full finetuning
float32_mixed_precision = False

Expand Down
56 changes: 52 additions & 4 deletions unsloth/save.py
Original file line number Diff line number Diff line change
Expand Up @@ -2218,12 +2218,60 @@ def unsloth_convert_lora_to_ggml_and_save_locally(


from .models.loader_utils import get_model_name
from unsloth_zoo.saving_utils import merge_and_overwrite_lora
from unsloth_zoo.saving_utils import (
merge_and_overwrite_lora,
prepare_saving,
)
from unsloth_zoo.llama_cpp import (
install_llama_cpp,
convert_to_gguf,
convert_to_gguf as _convert_to_gguf,
)

@torch.inference_mode
def save_to_gguf_generic(
    model,
    save_directory,
    quantization_type = "Q8_0",
    repo_id = None,
    token = None,
):
    """
    Convert the model files in `save_directory` to GGUF and optionally
    upload the resulting `*.gguf` files to the Hugging Face Hub.

    Args:
        model: Model object forwarded to `prepare_saving` when uploading.
        save_directory: Directory handed to the GGUF converter; also the
            folder whose `*.gguf` files are uploaded.
        quantization_type: Quantization passed through to the converter.
        repo_id: Hub repository to upload to. `None` skips the upload.
        token: Hub token. When `None` and `repo_id` is given, falls back
            to `get_token()`.

    Returns:
        Whatever the GGUF converter returns (bound to `metadata`).

    Raises:
        RuntimeError: If an upload is requested but no token is available.
    """
    if token is None and repo_id is not None: token = get_token()
    if repo_id is not None and token is None:
        raise RuntimeError("Unsloth: Please specify a token for uploading!")

    # The converter script is looked up relative to the current working
    # directory; fetch llama.cpp only when it is missing.
    if not os.path.exists(os.path.join("llama.cpp", "unsloth_convert_hf_to_gguf.py")):
        install_llama_cpp(just_clone_repo = True)
    pass

    metadata = _convert_to_gguf(
        save_directory,
        print_output = True,
        quantization_type = quantization_type,
    )
    if repo_id is not None:
        # Repo privacy is requested here, not in the upload call below.
        prepare_saving(
            model,
            repo_id,
            push_to_hub = True,
            max_shard_size = "50GB",
            private = True,
            token = token,
        )

        from huggingface_hub import HfApi
        api = HfApi(token = token)
        # NOTE: `HfApi.upload_folder` has no `private` parameter; passing it
        # raises TypeError, so it is intentionally not forwarded.
        api.upload_folder(
            folder_path = save_directory,
            repo_id = repo_id,
            repo_type = "model",
            allow_patterns = ["*.gguf"],
        )
    pass
    return metadata
pass


@torch.inference_mode
def unsloth_generic_save(
model,
Expand Down Expand Up @@ -2467,8 +2515,8 @@ def patch_saving_functions(model, vision = False):
# Vision only 1 option
model.push_to_hub_merged = types.MethodType(unsloth_generic_push_to_hub_merged, model)
model.save_pretrained_merged = types.MethodType(unsloth_generic_save_pretrained_merged, model)
model.push_to_hub_gguf = types.MethodType(not_implemented_save, model)
model.save_pretrained_gguf = types.MethodType(not_implemented_save, model)
model.push_to_hub_gguf = types.MethodType(save_to_gguf_generic, model)
model.save_pretrained_gguf = types.MethodType(save_to_gguf_generic, model)
pass
return model
pass