Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
470 commits
Select commit Hold shift + click to select a range
15073c0
Update rl.py
danielhanchen Feb 11, 2025
0c54b1e
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
a820ac6
Auto patching
danielhanchen Feb 11, 2025
15c5220
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
92a9f0b
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
61b1853
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
ea8739d
Update rl.py
danielhanchen Feb 11, 2025
61699bf
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
acbf23f
Update rl.py
danielhanchen Feb 11, 2025
b1b9af3
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
fee37b0
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
ff27094
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
6ab51be
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
b45f633
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
fd9e677
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
b9b3166
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
7fdab17
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
2595971
Update rl.py
danielhanchen Feb 11, 2025
f470f55
Update rl.py
danielhanchen Feb 11, 2025
ddfdca1
Update rl.py
danielhanchen Feb 11, 2025
3e0c7e2
Update rl.py
danielhanchen Feb 11, 2025
ae3f219
Update rl.py
danielhanchen Feb 11, 2025
5e71435
Update rl.py
danielhanchen Feb 11, 2025
883192d
Update rl.py
danielhanchen Feb 11, 2025
22c1cc1
Update rl.py
danielhanchen Feb 11, 2025
3fabc11
Update rl.py
danielhanchen Feb 11, 2025
d9687d5
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
4737380
Update rl.py
danielhanchen Feb 11, 2025
6abf22a
Update rl.py
danielhanchen Feb 11, 2025
5edcdf8
Update rl.py
danielhanchen Feb 11, 2025
7e55aef
max seq length
danielhanchen Feb 11, 2025
6a21b50
Update rl.py
danielhanchen Feb 11, 2025
035d24e
Update rl.py
danielhanchen Feb 11, 2025
b67327b
Patching
danielhanchen Feb 11, 2025
56bf7a1
Update rl.py
danielhanchen Feb 11, 2025
8c23657
Update rl.py
danielhanchen Feb 11, 2025
e735ab5
Update rl.py
danielhanchen Feb 12, 2025
484afd7
Update rl.py
danielhanchen Feb 12, 2025
4a23920
Update rl.py
danielhanchen Feb 12, 2025
19b16bb
NEFTune
danielhanchen Feb 12, 2025
7e19c0f
Update rl.py
danielhanchen Feb 12, 2025
0ac3d15
Update rl.py
danielhanchen Feb 12, 2025
70b341c
Update rl.py
danielhanchen Feb 12, 2025
3b641de
Update rl.py
danielhanchen Feb 12, 2025
30ad4c4
Update rl.py
danielhanchen Feb 12, 2025
a848c01
Update rl.py
danielhanchen Feb 12, 2025
f25abe6
Update rl.py
danielhanchen Feb 12, 2025
0694463
Extra replacements
danielhanchen Feb 12, 2025
8cc0338
Update rl_replacements.py
danielhanchen Feb 12, 2025
a145a83
Update rl.py
danielhanchen Feb 12, 2025
39fbcfb
extra RL replacements
danielhanchen Feb 12, 2025
2e68bb3
Update rl_replacements.py
danielhanchen Feb 12, 2025
82d3f6a
Update rl_replacements.py
danielhanchen Feb 12, 2025
0c691cf
Update rl_replacements.py
danielhanchen Feb 12, 2025
cd6f9b6
Update rl_replacements.py
danielhanchen Feb 12, 2025
be568b0
Update rl_replacements.py
danielhanchen Feb 12, 2025
94e8298
Merge branch 'main' into nightly
danielhanchen Feb 12, 2025
9ade782
Update rl_replacements.py
danielhanchen Feb 12, 2025
e498150
Update llama.py
danielhanchen Feb 12, 2025
2a5aa3d
Update rl_replacements.py
danielhanchen Feb 12, 2025
2524538
Update _utils.py
danielhanchen Feb 12, 2025
c9ba000
Update loader_utils.py
danielhanchen Feb 12, 2025
5b2fd72
Update rl.py
danielhanchen Feb 12, 2025
3466186
Update rl_replacements.py
danielhanchen Feb 12, 2025
5dc8847
Update rl_replacements.py
danielhanchen Feb 12, 2025
9aad48e
Update rl.py
danielhanchen Feb 12, 2025
f121a5c
Update llama.py
danielhanchen Feb 12, 2025
5052d35
Update llama.py
danielhanchen Feb 12, 2025
a11aa96
Update llama.py
danielhanchen Feb 12, 2025
a6abe02
Update llama.py
danielhanchen Feb 12, 2025
d867faa
autocast
danielhanchen Feb 12, 2025
44c9228
Update rl_replacements.py
danielhanchen Feb 12, 2025
e83d854
Update llama.py
danielhanchen Feb 12, 2025
623eb65
Update rl_replacements.py
danielhanchen Feb 13, 2025
7e612f0
Update rl_replacements.py
danielhanchen Feb 13, 2025
a45266b
Update rl_replacements.py
danielhanchen Feb 13, 2025
c855d7e
Update rl_replacements.py
danielhanchen Feb 13, 2025
d7cefba
Update llama.py
danielhanchen Feb 13, 2025
52d996a
Update rl_replacements.py
danielhanchen Feb 13, 2025
56f5b31
Update llama.py
danielhanchen Feb 13, 2025
5f1e98c
Update llama.py
danielhanchen Feb 13, 2025
e713129
Update llama.py
danielhanchen Feb 13, 2025
310fc16
Update llama.py
danielhanchen Feb 13, 2025
76a122e
Update llama.py
danielhanchen Feb 13, 2025
2dd29e5
Update rl_replacements.py
danielhanchen Feb 13, 2025
3c5be91
Update llama.py
danielhanchen Feb 13, 2025
e548b15
Update llama.py
danielhanchen Feb 13, 2025
296b3b3
Update llama.py
danielhanchen Feb 13, 2025
8de588b
Update llama.py
danielhanchen Feb 13, 2025
f87909a
Update pyproject.toml
danielhanchen Feb 13, 2025
2704440
Update llama.py
danielhanchen Feb 13, 2025
42e1967
Update llama.py
danielhanchen Feb 13, 2025
36bf805
Update llama.py
danielhanchen Feb 13, 2025
a3af8e3
Update llama.py
danielhanchen Feb 13, 2025
9d10d2f
Update llama.py
danielhanchen Feb 13, 2025
b30a81f
Update llama.py
danielhanchen Feb 13, 2025
b7e8559
Update llama.py
danielhanchen Feb 13, 2025
4b201d9
Update rl_replacements.py
danielhanchen Feb 13, 2025
dc723bc
Update rl_replacements.py
danielhanchen Feb 13, 2025
0309949
Update rl_replacements.py
danielhanchen Feb 13, 2025
c409574
Update rl_replacements.py
danielhanchen Feb 13, 2025
8e5b09a
Update llama.py
danielhanchen Feb 13, 2025
6652f1d
Update rl_replacements.py
danielhanchen Feb 13, 2025
9215bbe
Update rl_replacements.py
danielhanchen Feb 13, 2025
4bff998
Update rl_replacements.py
danielhanchen Feb 13, 2025
c859030
Update rl_replacements.py
danielhanchen Feb 13, 2025
2daa8e3
Update rl_replacements.py
danielhanchen Feb 13, 2025
527a0c4
Update rl_replacements.py
danielhanchen Feb 13, 2025
087a5dc
Update rl_replacements.py
danielhanchen Feb 13, 2025
73210b3
Update rl_replacements.py
danielhanchen Feb 13, 2025
9934ac5
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
2635f2a
Update llama.py
danielhanchen Feb 13, 2025
69ab838
Update _utils.py
danielhanchen Feb 13, 2025
d5d7a06
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
c9e450f
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
44d00e8
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
447dfc4
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
acf98dc
Update llama.py
danielhanchen Feb 14, 2025
1399110
Update _utils.py
danielhanchen Feb 14, 2025
881105b
Update rl_replacements.py
danielhanchen Feb 14, 2025
cfdd3f1
Update rl.py
danielhanchen Feb 14, 2025
95b7df5
Update rl.py
danielhanchen Feb 14, 2025
17bfcf9
Update rl.py
danielhanchen Feb 14, 2025
61c219d
Update rl.py
danielhanchen Feb 14, 2025
9794dc2
Update rl.py
danielhanchen Feb 14, 2025
3687a6f
Update llama.py
danielhanchen Feb 14, 2025
c495bfa
Update llama.py
danielhanchen Feb 14, 2025
f9055a7
Update llama.py
danielhanchen Feb 14, 2025
945e3f9
Update llama.py
danielhanchen Feb 14, 2025
3d9fe12
Update rl_replacements.py
danielhanchen Feb 14, 2025
ed90785
Update llama.py
danielhanchen Feb 14, 2025
640bc88
Update llama.py
danielhanchen Feb 14, 2025
bb3bb2d
Update llama.py
danielhanchen Feb 14, 2025
9065938
Update llama.py
danielhanchen Feb 14, 2025
07b48f5
Merge branch 'main' into nightly
danielhanchen Feb 14, 2025
48c5e0d
GRPO optimized
danielhanchen Feb 14, 2025
3a1fb63
Update rl.py
danielhanchen Feb 14, 2025
19014b0
Update rl_replacements.py
danielhanchen Feb 14, 2025
0c17e79
Update rl_replacements.py
danielhanchen Feb 14, 2025
aee44e2
Update rl.py
danielhanchen Feb 14, 2025
953d957
Update rl.py
danielhanchen Feb 14, 2025
2a2b9f7
Update rl.py
danielhanchen Feb 14, 2025
fcb0f4a
Update rl.py
danielhanchen Feb 14, 2025
eabc365
Update rl_replacements.py
danielhanchen Feb 14, 2025
7408318
Update rl_replacements.py
danielhanchen Feb 14, 2025
f35eae3
Update rl_replacements.py
danielhanchen Feb 14, 2025
2b89dae
Selective Log softmax
danielhanchen Feb 14, 2025
45c8431
Fix GRPO bsz
danielhanchen Feb 14, 2025
644cedf
Update rl.py
danielhanchen Feb 14, 2025
4b765d7
Update rl_replacements.py
danielhanchen Feb 14, 2025
0a7c56d
Update rl_replacements.py
danielhanchen Feb 15, 2025
1b43e1d
Update rl_replacements.py
danielhanchen Feb 15, 2025
d588665
Update rl_replacements.py
danielhanchen Feb 15, 2025
54bd827
Fix TRL
danielhanchen Feb 15, 2025
c6d6e6b
Merge branch 'main' into nightly
danielhanchen Feb 15, 2025
fa560ce
Metrics GRPO
danielhanchen Feb 15, 2025
46462f1
Update rl_replacements.py
danielhanchen Feb 15, 2025
12c497a
Update rl_replacements.py
danielhanchen Feb 15, 2025
b8aca94
Merge branch 'main' into nightly
danielhanchen Feb 15, 2025
c14faee
No compile
danielhanchen Feb 16, 2025
1fcad32
Update rl.py
danielhanchen Feb 16, 2025
80be827
Remove docs
danielhanchen Feb 16, 2025
9254243
Update rl.py
danielhanchen Feb 16, 2025
09cb804
Update rl.py
danielhanchen Feb 16, 2025
86dabcf
Update rl.py
danielhanchen Feb 16, 2025
ba1c93e
Update rl.py
danielhanchen Feb 16, 2025
0d75afd
Update rl_replacements.py
danielhanchen Feb 16, 2025
1803658
Update rl.py
danielhanchen Feb 16, 2025
a856085
Update rl.py
danielhanchen Feb 16, 2025
eeac4f3
Update rl_replacements.py
danielhanchen Feb 16, 2025
6f1beb0
Update rl_replacements.py
danielhanchen Feb 16, 2025
222b1e7
llama-quantize on WINDOWS WSL error fix - edit save.py (gguf saving b…
everythingisc00l Feb 16, 2025
103cff4
Update rl_replacements.py
danielhanchen Feb 17, 2025
89a1d03
Update rl_replacements.py
danielhanchen Feb 17, 2025
c46b544
Update rl_replacements.py
danielhanchen Feb 17, 2025
ed84307
Update rl_replacements.py
danielhanchen Feb 17, 2025
93d3f16
Update rl_replacements.py
danielhanchen Feb 17, 2025
429ba6d
Update rl_replacements.py
danielhanchen Feb 17, 2025
1e42bad
Update rl_replacements.py
danielhanchen Feb 17, 2025
38a1885
Update rl_replacements.py
danielhanchen Feb 17, 2025
f0ee4f5
Update rl_replacements.py
danielhanchen Feb 17, 2025
b68dce6
Update rl_replacements.py
danielhanchen Feb 17, 2025
0827067
Update llama.py
danielhanchen Feb 17, 2025
204cd7a
Update rl_replacements.py
danielhanchen Feb 17, 2025
e141075
Update rl_replacements.py
danielhanchen Feb 17, 2025
a07a9e3
Update rl_replacements.py
danielhanchen Feb 17, 2025
cf2720d
Update llama.py
danielhanchen Feb 17, 2025
5c6f586
Update llama.py
danielhanchen Feb 18, 2025
2e07623
Update rl_replacements.py
danielhanchen Feb 18, 2025
8025cfe
Update rl_replacements.py
danielhanchen Feb 18, 2025
ba48495
Update rl_replacements.py
danielhanchen Feb 18, 2025
f0078de
Update rl.py
danielhanchen Feb 18, 2025
15e0140
Update rl.py
danielhanchen Feb 18, 2025
5f5cca4
Update rl_replacements.py
danielhanchen Feb 18, 2025
d80be70
Update rl.py
danielhanchen Feb 18, 2025
47a85eb
Update rl.py
danielhanchen Feb 18, 2025
f09478d
Update rl_replacements.py
danielhanchen Feb 18, 2025
97637c5
Update rl_replacements.py
danielhanchen Feb 18, 2025
58bd27f
Update rl_replacements.py
danielhanchen Feb 18, 2025
7c0c749
Update rl_replacements.py
danielhanchen Feb 18, 2025
97b55c1
Update rl_replacements.py
danielhanchen Feb 18, 2025
24c7a2f
Update rl_replacements.py
danielhanchen Feb 18, 2025
06b2cd3
unsloth_num_chunks
danielhanchen Feb 18, 2025
cbb16e3
Update rl.py
danielhanchen Feb 18, 2025
d16299b
Update rl_replacements.py
danielhanchen Feb 18, 2025
0c1a808
Update rl_replacements.py
danielhanchen Feb 18, 2025
6796801
Update rl_replacements.py
danielhanchen Feb 18, 2025
bd046ca
Update rl.py
danielhanchen Feb 18, 2025
ac2e814
Update rl.py
danielhanchen Feb 18, 2025
a88712f
Update rl.py
danielhanchen Feb 18, 2025
0daa328
Update rl.py
danielhanchen Feb 18, 2025
1afe3f2
Update rl.py
danielhanchen Feb 18, 2025
6732822
Update rl_replacements.py
danielhanchen Feb 18, 2025
5efe9f3
Update rl_replacements.py
danielhanchen Feb 18, 2025
15442d1
Update rl_replacements.py (#1754)
SethHWeidman Feb 19, 2025
91ab43d
Optional logits
danielhanchen Feb 19, 2025
a6a5f60
Update rl.py
danielhanchen Feb 19, 2025
83ce085
Update rl.py
danielhanchen Feb 19, 2025
8ece11f
Update rl.py
danielhanchen Feb 19, 2025
bc6bfae
Update rl.py
danielhanchen Feb 20, 2025
95fb6a4
Update rl.py
danielhanchen Feb 20, 2025
ba01cf5
Update rl.py
danielhanchen Feb 20, 2025
eb48b98
Update rl.py
danielhanchen Feb 20, 2025
3c750a1
Update rl.py
danielhanchen Feb 20, 2025
515cf5a
Update rl_replacements.py
danielhanchen Feb 20, 2025
2cf4349
Update rl.py
danielhanchen Feb 20, 2025
ae8bf68
Update rl.py
danielhanchen Feb 20, 2025
e07f4bc
Update rl.py
danielhanchen Feb 20, 2025
f11e5ab
Merge branch 'main' into nightly
danielhanchen Feb 20, 2025
3fccf5d
Update rl.py
danielhanchen Feb 20, 2025
798ad95
fix an import error (#1767)
NinoRisteski Feb 20, 2025
2957d89
SamplingParams
danielhanchen Feb 20, 2025
19d57bc
Convert mask to float (#1762)
Erland366 Feb 20, 2025
07aea40
[Windows Support] Add latest `xformers` wheels to pyproject.toml (#1753)
versipellis Feb 20, 2025
77109a4
Merge branch 'nightly' of https://github.com/unslothai/unsloth into nightly
danielhanchen Feb 20, 2025
f3d9efb
vLLMSamplingParams
danielhanchen Feb 20, 2025
6d5caca
Update __init__.py
danielhanchen Feb 20, 2025
3a5610e
default num_chunks == -1
danielhanchen Feb 20, 2025
0362bd2
Versioning
danielhanchen Feb 20, 2025
2969db8
Merge branch 'main' into nightly
danielhanchen Feb 20, 2025
b5eda24
Update llama.py
danielhanchen Feb 20, 2025
7de0022
Update llama.py
danielhanchen Feb 20, 2025
d4d7694
Update llama.py
danielhanchen Feb 20, 2025
0bbfbe8
Update llama.py
danielhanchen Feb 20, 2025
ae6e2bd
Update llama.py
danielhanchen Feb 20, 2025
1792deb
Update _utils.py
danielhanchen Feb 20, 2025
5dcd079
Update rl_replacements.py
danielhanchen Feb 20, 2025
ec6e0b7
Update rl_replacements.py
danielhanchen Feb 20, 2025
bc1d2ce
Update pyproject.toml
danielhanchen Feb 20, 2025
adbe38e
Update pyproject.toml
danielhanchen Feb 20, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 4 additions & 4 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -39,7 +39,7 @@ triton = [
"triton @ https://github.com/woct0rdho/triton-windows/releases/download/v3.1.0-windows.post5/triton-3.1.0-cp312-cp312-win_amd64.whl ; python_version=='3.12' and platform_system == 'Windows'",
]
huggingface = [
"unsloth_zoo>=2025.2.6",
"unsloth_zoo>=2025.2.7",
"packaging",
"tyro",
"transformers>=4.46.1,!=4.47.0",
Expand All @@ -50,7 +50,7 @@ huggingface = [
"wheel>=0.42.0",
"numpy",
"accelerate>=0.34.1",
"trl>=0.7.9,!=0.9.0,!=0.9.1,!=0.9.2,!=0.9.3",
"trl>=0.7.9,!=0.9.0,!=0.9.1,!=0.9.2,!=0.9.3,!=0.15.0",
"peft>=0.7.1,!=0.11.0",
"protobuf<4.0.0",
"huggingface_hub",
Expand Down Expand Up @@ -348,7 +348,7 @@ colab-ampere-torch220 = [
"flash-attn>=2.6.3",
]
colab-new = [
"unsloth_zoo>=2025.2.6",
"unsloth_zoo>=2025.2.7",
"packaging",
"tyro",
"transformers>=4.46.1,!=4.47.0",
Expand All @@ -366,7 +366,7 @@ colab-new = [
]
colab-no-deps = [
"accelerate>=0.34.1",
"trl>=0.7.9,!=0.9.0,!=0.9.1,!=0.9.2,!=0.9.3",
"trl>=0.7.9,!=0.9.0,!=0.9.1,!=0.9.2,!=0.9.3,!=0.15.0",
"peft>=0.7.1",
"xformers",
"bitsandbytes>=0.46.1",
Expand Down
5 changes: 5 additions & 0 deletions unsloth/models/_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -143,6 +143,11 @@ def filter(self, x): return not (self.text in x.getMessage())
transformers_training_args_logger.addFilter(HideLoggingMessage("torch.distributed"))
del transformers_training_args_logger

# No label_names provided for model class
from transformers.trainer import logger as transformers_trainer_logger
transformers_trainer_logger.addFilter(HideLoggingMessage("No label_names"))
del transformers_trainer_logger

# Using the default loss: `ForCausalLMLoss`.
try:
from transformers.modeling_utils import logger as transformers_modeling_utils_logger
Expand Down
5 changes: 3 additions & 2 deletions unsloth/models/llama.py
Original file line number Diff line number Diff line change
Expand Up @@ -725,8 +725,9 @@ def LlamaModel_fast_forward(
past_key_values_length,
sliding_window = getattr(self.config, "sliding_window", None),
)
if attention_mask is not None:
attention_mask = attention_mask.to(torch.bool)
# Must NOT convert to bool - weirdly this causes stuff to error out!
# if attention_mask is not None:
# attention_mask = attention_mask.to(torch.bool)
pass

hidden_states = inputs_embeds
Expand Down
7 changes: 4 additions & 3 deletions unsloth/models/rl_replacements.py
Original file line number Diff line number Diff line change
Expand Up @@ -164,10 +164,11 @@ def grpo_trainer__prepare_inputs(function_name, function):
# Remove _move_model_to_vllm
def grpo_trainer__move_model_to_vllm(function_name, function):
if function_name != "_move_model_to_vllm": return function

def _move_model_to_vllm(self, *args, **kwargs): return None

# .*? matches first match. .+? matches final match.
replacement = "def _move_model_to_vllm(self, *args, **kwargs): return None\n"
return " "*function.find("def") + replacement
function = inspect.getsource(_move_model_to_vllm)
return function
pass
RL_FUNCTIONS["grpo_trainer"].append(grpo_trainer__move_model_to_vllm)

Expand Down