Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
354 commits
Select commit Hold shift + click to select a range
1ce40ce
Bug fixes
danielhanchen Jan 20, 2025
cdb3259
fix: flash_attn_detection_error (#1556)
Zzhiter Jan 20, 2025
6701064
Merge branch 'main' into nightly
danielhanchen Jan 23, 2025
6532949
Update mapper.py
danielhanchen Jan 31, 2025
9c28145
Merge branch 'main' into nightly
danielhanchen Jan 31, 2025
5efdda2
Merge branch 'main' into nightly
danielhanchen Jan 31, 2025
ea492f2
Update gemma.py
danielhanchen Feb 2, 2025
e4c3557
Update gemma.py
danielhanchen Feb 2, 2025
ad3039b
Update gemma.py
danielhanchen Feb 2, 2025
ffe6a73
Update gemma.py
danielhanchen Feb 2, 2025
a5226eb
dim fix
danielhanchen Feb 2, 2025
e45342c
Update _utils.py
danielhanchen Feb 2, 2025
0243efb
Merge branch 'main' into nightly
danielhanchen Feb 2, 2025
c81ce12
Torch 2.6 support
danielhanchen Feb 2, 2025
fb0526b
Update llama.py
danielhanchen Feb 2, 2025
f14adf1
Update llama.py
danielhanchen Feb 2, 2025
03083b6
Update llama.py
danielhanchen Feb 2, 2025
1501195
Update llama.py
danielhanchen Feb 2, 2025
e6b93e2
Update llama.py
danielhanchen Feb 2, 2025
e550ff0
Update llama.py
danielhanchen Feb 2, 2025
99a8705
Update llama.py
danielhanchen Feb 2, 2025
f04336f
Update llama.py
danielhanchen Feb 2, 2025
b4cf11f
Update llama.py
danielhanchen Feb 2, 2025
20255ef
Update llama.py
danielhanchen Feb 2, 2025
04b0c45
Update llama.py
danielhanchen Feb 2, 2025
8e83373
Update llama.py
danielhanchen Feb 2, 2025
cd4b039
Faster inference?
danielhanchen Feb 2, 2025
c7ac842
Update llama.py
danielhanchen Feb 2, 2025
0575002
Update llama.py
danielhanchen Feb 2, 2025
cc88d1b
Update utils.py
danielhanchen Feb 2, 2025
19c4085
Update llama.py
danielhanchen Feb 2, 2025
1ff67e3
Update llama.py
danielhanchen Feb 2, 2025
8b37bc1
Update utils.py
danielhanchen Feb 2, 2025
b734d72
Update utils.py
danielhanchen Feb 2, 2025
9c7618c
Update utils.py
danielhanchen Feb 3, 2025
e530002
Update utils.py
danielhanchen Feb 3, 2025
404ac62
Update utils.py
danielhanchen Feb 3, 2025
78395a4
Update utils.py
danielhanchen Feb 3, 2025
4386c2a
Update utils.py
danielhanchen Feb 3, 2025
62fe595
Update utils.py
danielhanchen Feb 3, 2025
366ca87
Update utils.py
danielhanchen Feb 3, 2025
5d0f36a
Update utils.py
danielhanchen Feb 3, 2025
ed596d9
Update utils.py
danielhanchen Feb 3, 2025
d652dc1
Update utils.py
danielhanchen Feb 3, 2025
ec266cf
Update utils.py
danielhanchen Feb 3, 2025
b861b66
Update mapper.py
danielhanchen Feb 4, 2025
ba15116
Fast Inference via vLLM
danielhanchen Feb 5, 2025
d2aef04
Update llama.py
danielhanchen Feb 5, 2025
48bdd41
Update llama.py
danielhanchen Feb 5, 2025
2a8ba7b
Update utils.py
danielhanchen Feb 5, 2025
cf13d54
Create rl.py
danielhanchen Feb 5, 2025
38e6ec2
PatchRL
danielhanchen Feb 5, 2025
886b3c8
Update rl.py
danielhanchen Feb 5, 2025
8724b1a
Update rl.py
danielhanchen Feb 5, 2025
870bd33
Update rl.py
danielhanchen Feb 5, 2025
efa4bd8
PatchRLStatistics
danielhanchen Feb 5, 2025
3848350
Update rl.py
danielhanchen Feb 5, 2025
f8b03ee
Update rl.py
danielhanchen Feb 5, 2025
44db7fc
Update rl.py
danielhanchen Feb 5, 2025
deb7a87
Update utils.py
danielhanchen Feb 5, 2025
47c9ff3
Update utils.py
danielhanchen Feb 5, 2025
7bec3c1
Update rl.py
danielhanchen Feb 5, 2025
2c0c7b3
Update rl.py
danielhanchen Feb 5, 2025
5ccb46a
Update rl.py
danielhanchen Feb 5, 2025
eeca1a6
Update rl.py
danielhanchen Feb 5, 2025
4d1e272
Update rl.py
danielhanchen Feb 5, 2025
906055d
Update rl.py
danielhanchen Feb 5, 2025
e8ca0e7
Update rl.py
danielhanchen Feb 5, 2025
9a2999b
Update rl.py
danielhanchen Feb 5, 2025
6d92ed6
Update rl.py
danielhanchen Feb 5, 2025
2c6f31f
Update rl.py
danielhanchen Feb 5, 2025
65f991e
Update rl.py
danielhanchen Feb 5, 2025
c08c009
Update rl.py
danielhanchen Feb 5, 2025
a773af2
Update rl.py
danielhanchen Feb 5, 2025
fb24fc0
Update rl.py
danielhanchen Feb 5, 2025
30b0fa8
Update rl.py
danielhanchen Feb 5, 2025
5bb5bfb
RL metrics
danielhanchen Feb 5, 2025
0b6db78
Update rl.py
danielhanchen Feb 5, 2025
115701a
RL metrics
danielhanchen Feb 5, 2025
12038fd
Update __init__.py
danielhanchen Feb 5, 2025
e2a526e
Update rl.py
danielhanchen Feb 5, 2025
e74dbb5
Update rl.py
danielhanchen Feb 5, 2025
054ebb3
Update rl.py
danielhanchen Feb 5, 2025
4d68b9c
Update chat_templates.py
danielhanchen Feb 6, 2025
547867d
Update mapper.py
danielhanchen Feb 6, 2025
8be4bfa
Fp8 cache
danielhanchen Feb 6, 2025
9eb8bf1
Update llama.py
danielhanchen Feb 6, 2025
d2b66ca
Update llama.py
danielhanchen Feb 6, 2025
604329c
Update rl.py
danielhanchen Feb 6, 2025
2c158df
Update rl.py
danielhanchen Feb 6, 2025
43116a2
Update rl.py
danielhanchen Feb 6, 2025
656ce86
Update rl.py
danielhanchen Feb 6, 2025
832cd9b
Update rl.py
danielhanchen Feb 6, 2025
8178b32
Update rl.py
danielhanchen Feb 6, 2025
40bb945
Update rl.py
danielhanchen Feb 6, 2025
9d71ee4
Update rl.py
danielhanchen Feb 6, 2025
1ee8492
Update rl.py
danielhanchen Feb 6, 2025
58cd0c9
Update rl.py
danielhanchen Feb 6, 2025
fd347a2
Update rl.py
danielhanchen Feb 6, 2025
9d06a56
Update rl.py
danielhanchen Feb 6, 2025
00b6aa8
Update rl.py
danielhanchen Feb 6, 2025
2c2388e
Update rl.py
danielhanchen Feb 6, 2025
9e3e1ba
Update rl.py
danielhanchen Feb 6, 2025
505daf8
Update rl.py
danielhanchen Feb 6, 2025
5d53641
Update rl.py
danielhanchen Feb 6, 2025
cfb1a00
Update __init__.py
danielhanchen Feb 6, 2025
1f5a418
Update loader.py
danielhanchen Feb 6, 2025
7a8d910
Merge branch 'main' into nightly
danielhanchen Feb 6, 2025
34d92aa
Update rl.py
danielhanchen Feb 6, 2025
8b7c3af
Update rl.py
danielhanchen Feb 6, 2025
066ec25
Update _utils.py
danielhanchen Feb 6, 2025
cb90aae
Merge branch 'main' into nightly
danielhanchen Feb 7, 2025
af8a21b
Merge branch 'main' into nightly
danielhanchen Feb 10, 2025
052b93f
Update tokenizer_utils.py
danielhanchen Feb 10, 2025
fdac025
Update tokenizer_utils.py
danielhanchen Feb 10, 2025
ade058e
Better TRL handling
danielhanchen Feb 11, 2025
15073c0
Update rl.py
danielhanchen Feb 11, 2025
0c54b1e
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
a820ac6
Auto patching
danielhanchen Feb 11, 2025
15c5220
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
92a9f0b
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
61b1853
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
ea8739d
Update rl.py
danielhanchen Feb 11, 2025
61699bf
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
acbf23f
Update rl.py
danielhanchen Feb 11, 2025
b1b9af3
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
fee37b0
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
ff27094
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
6ab51be
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
b45f633
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
fd9e677
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
b9b3166
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
7fdab17
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
2595971
Update rl.py
danielhanchen Feb 11, 2025
f470f55
Update rl.py
danielhanchen Feb 11, 2025
ddfdca1
Update rl.py
danielhanchen Feb 11, 2025
3e0c7e2
Update rl.py
danielhanchen Feb 11, 2025
ae3f219
Update rl.py
danielhanchen Feb 11, 2025
5e71435
Update rl.py
danielhanchen Feb 11, 2025
883192d
Update rl.py
danielhanchen Feb 11, 2025
22c1cc1
Update rl.py
danielhanchen Feb 11, 2025
3fabc11
Update rl.py
danielhanchen Feb 11, 2025
d9687d5
Update tokenizer_utils.py
danielhanchen Feb 11, 2025
4737380
Update rl.py
danielhanchen Feb 11, 2025
6abf22a
Update rl.py
danielhanchen Feb 11, 2025
5edcdf8
Update rl.py
danielhanchen Feb 11, 2025
7e55aef
max seq length
danielhanchen Feb 11, 2025
6a21b50
Update rl.py
danielhanchen Feb 11, 2025
035d24e
Update rl.py
danielhanchen Feb 11, 2025
b67327b
Patching
danielhanchen Feb 11, 2025
56bf7a1
Update rl.py
danielhanchen Feb 11, 2025
8c23657
Update rl.py
danielhanchen Feb 11, 2025
e735ab5
Update rl.py
danielhanchen Feb 12, 2025
484afd7
Update rl.py
danielhanchen Feb 12, 2025
4a23920
Update rl.py
danielhanchen Feb 12, 2025
19b16bb
NEFTune
danielhanchen Feb 12, 2025
7e19c0f
Update rl.py
danielhanchen Feb 12, 2025
0ac3d15
Update rl.py
danielhanchen Feb 12, 2025
70b341c
Update rl.py
danielhanchen Feb 12, 2025
3b641de
Update rl.py
danielhanchen Feb 12, 2025
30ad4c4
Update rl.py
danielhanchen Feb 12, 2025
a848c01
Update rl.py
danielhanchen Feb 12, 2025
f25abe6
Update rl.py
danielhanchen Feb 12, 2025
0694463
Extra replacements
danielhanchen Feb 12, 2025
8cc0338
Update rl_replacements.py
danielhanchen Feb 12, 2025
a145a83
Update rl.py
danielhanchen Feb 12, 2025
39fbcfb
extra RL replacements
danielhanchen Feb 12, 2025
2e68bb3
Update rl_replacements.py
danielhanchen Feb 12, 2025
82d3f6a
Update rl_replacements.py
danielhanchen Feb 12, 2025
0c691cf
Update rl_replacements.py
danielhanchen Feb 12, 2025
cd6f9b6
Update rl_replacements.py
danielhanchen Feb 12, 2025
be568b0
Update rl_replacements.py
danielhanchen Feb 12, 2025
94e8298
Merge branch 'main' into nightly
danielhanchen Feb 12, 2025
9ade782
Update rl_replacements.py
danielhanchen Feb 12, 2025
e498150
Update llama.py
danielhanchen Feb 12, 2025
2a5aa3d
Update rl_replacements.py
danielhanchen Feb 12, 2025
2524538
Update _utils.py
danielhanchen Feb 12, 2025
c9ba000
Update loader_utils.py
danielhanchen Feb 12, 2025
5b2fd72
Update rl.py
danielhanchen Feb 12, 2025
3466186
Update rl_replacements.py
danielhanchen Feb 12, 2025
5dc8847
Update rl_replacements.py
danielhanchen Feb 12, 2025
9aad48e
Update rl.py
danielhanchen Feb 12, 2025
f121a5c
Update llama.py
danielhanchen Feb 12, 2025
5052d35
Update llama.py
danielhanchen Feb 12, 2025
a11aa96
Update llama.py
danielhanchen Feb 12, 2025
a6abe02
Update llama.py
danielhanchen Feb 12, 2025
d867faa
autocast
danielhanchen Feb 12, 2025
44c9228
Update rl_replacements.py
danielhanchen Feb 12, 2025
e83d854
Update llama.py
danielhanchen Feb 12, 2025
623eb65
Update rl_replacements.py
danielhanchen Feb 13, 2025
7e612f0
Update rl_replacements.py
danielhanchen Feb 13, 2025
a45266b
Update rl_replacements.py
danielhanchen Feb 13, 2025
c855d7e
Update rl_replacements.py
danielhanchen Feb 13, 2025
d7cefba
Update llama.py
danielhanchen Feb 13, 2025
52d996a
Update rl_replacements.py
danielhanchen Feb 13, 2025
56f5b31
Update llama.py
danielhanchen Feb 13, 2025
5f1e98c
Update llama.py
danielhanchen Feb 13, 2025
e713129
Update llama.py
danielhanchen Feb 13, 2025
310fc16
Update llama.py
danielhanchen Feb 13, 2025
76a122e
Update llama.py
danielhanchen Feb 13, 2025
2dd29e5
Update rl_replacements.py
danielhanchen Feb 13, 2025
3c5be91
Update llama.py
danielhanchen Feb 13, 2025
e548b15
Update llama.py
danielhanchen Feb 13, 2025
296b3b3
Update llama.py
danielhanchen Feb 13, 2025
8de588b
Update llama.py
danielhanchen Feb 13, 2025
f87909a
Update pyproject.toml
danielhanchen Feb 13, 2025
2704440
Update llama.py
danielhanchen Feb 13, 2025
42e1967
Update llama.py
danielhanchen Feb 13, 2025
36bf805
Update llama.py
danielhanchen Feb 13, 2025
a3af8e3
Update llama.py
danielhanchen Feb 13, 2025
9d10d2f
Update llama.py
danielhanchen Feb 13, 2025
b30a81f
Update llama.py
danielhanchen Feb 13, 2025
b7e8559
Update llama.py
danielhanchen Feb 13, 2025
4b201d9
Update rl_replacements.py
danielhanchen Feb 13, 2025
dc723bc
Update rl_replacements.py
danielhanchen Feb 13, 2025
0309949
Update rl_replacements.py
danielhanchen Feb 13, 2025
c409574
Update rl_replacements.py
danielhanchen Feb 13, 2025
8e5b09a
Update llama.py
danielhanchen Feb 13, 2025
6652f1d
Update rl_replacements.py
danielhanchen Feb 13, 2025
9215bbe
Update rl_replacements.py
danielhanchen Feb 13, 2025
4bff998
Update rl_replacements.py
danielhanchen Feb 13, 2025
c859030
Update rl_replacements.py
danielhanchen Feb 13, 2025
2daa8e3
Update rl_replacements.py
danielhanchen Feb 13, 2025
527a0c4
Update rl_replacements.py
danielhanchen Feb 13, 2025
087a5dc
Update rl_replacements.py
danielhanchen Feb 13, 2025
73210b3
Update rl_replacements.py
danielhanchen Feb 13, 2025
9934ac5
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
2635f2a
Update llama.py
danielhanchen Feb 13, 2025
69ab838
Update _utils.py
danielhanchen Feb 13, 2025
d5d7a06
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
c9e450f
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
44d00e8
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
447dfc4
Merge branch 'main' into nightly
danielhanchen Feb 13, 2025
acf98dc
Update llama.py
danielhanchen Feb 14, 2025
1399110
Update _utils.py
danielhanchen Feb 14, 2025
881105b
Update rl_replacements.py
danielhanchen Feb 14, 2025
cfdd3f1
Update rl.py
danielhanchen Feb 14, 2025
95b7df5
Update rl.py
danielhanchen Feb 14, 2025
17bfcf9
Update rl.py
danielhanchen Feb 14, 2025
61c219d
Update rl.py
danielhanchen Feb 14, 2025
9794dc2
Update rl.py
danielhanchen Feb 14, 2025
3687a6f
Update llama.py
danielhanchen Feb 14, 2025
c495bfa
Update llama.py
danielhanchen Feb 14, 2025
f9055a7
Update llama.py
danielhanchen Feb 14, 2025
945e3f9
Update llama.py
danielhanchen Feb 14, 2025
3d9fe12
Update rl_replacements.py
danielhanchen Feb 14, 2025
ed90785
Update llama.py
danielhanchen Feb 14, 2025
640bc88
Update llama.py
danielhanchen Feb 14, 2025
bb3bb2d
Update llama.py
danielhanchen Feb 14, 2025
9065938
Update llama.py
danielhanchen Feb 14, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion unsloth/models/_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@
# See the License for the specific language governing permissions and
# limitations under the License.

-__version__ = "2025.2.8"
+__version__ = "2025.2.9"

__all__ = [
"SUPPORTS_BFLOAT16",
Expand Down
5 changes: 3 additions & 2 deletions unsloth/models/llama.py
Original file line number Diff line number Diff line change
Expand Up @@ -708,7 +708,7 @@ def LlamaModel_fast_forward(
if attention_mask is None:
padding_mask = None
elif self.training:
-# elif attention_mask is not None and self.training:
+# elif attention_mask is None:
attention_mask = None
padding_mask = None
else:
Expand All @@ -724,7 +724,8 @@ def LlamaModel_fast_forward(
past_key_values_length,
sliding_window = getattr(self.config, "sliding_window", None),
)
-attention_mask = attention_mask.to(torch.bool)
+if attention_mask is not None:
+attention_mask = attention_mask.to(torch.bool)
pass

hidden_states = inputs_embeds
Expand Down
8 changes: 4 additions & 4 deletions unsloth/models/rl.py
Original file line number Diff line number Diff line change
Expand Up @@ -565,8 +565,8 @@ def patch_trl_rl_trainers():


def PatchFastRL(algorithm = None, FastLanguageModel = None):
-return
-# if FastLanguageModel is not None: PatchRL(FastLanguageModel)
-# patch_trl_rl_trainers()
-# if algorithm is not None: PatchRLStatistics(algorithm)
+if FastLanguageModel is not None: PatchRL(FastLanguageModel)
+patch_trl_rl_trainers()
+if type(algorithm) is str and algorithm.islower():
+PatchRLStatistics(algorithm)
pass
25 changes: 11 additions & 14 deletions unsloth/models/rl_replacements.py
Original file line number Diff line number Diff line change
Expand Up @@ -101,23 +101,20 @@ def sft_trainer_prepare_dataset(function_name, function):

# Ignore mean_token_accuracy since it needs logits
# We override it directly with our version
-def _sft_trainer_compute_loss(self, model, inputs, return_outputs = False, num_items_in_batch = None):
-(loss, outputs) = super().compute_loss(
-model,
-inputs,
-return_outputs = return_outputs,
-num_items_in_batch = num_items_in_batch,
-)
-return (loss, outputs) if return_outputs else loss
-pass
-
def sft_trainer_compute_loss(function_name, function):
if function_name != "compute_loss": return function

-function = inspect.getsource(_sft_trainer_compute_loss)
-function = function.replace("def _sft_trainer_compute_loss", "def compute_loss")
-function = function.split("\n")
-function = "\n".join(" "*4+x for x in function)
+def compute_loss(self, model, inputs, return_outputs = False, num_items_in_batch = None):
+outputs = super().compute_loss(
+model,
+inputs,
+return_outputs = return_outputs,
+num_items_in_batch = num_items_in_batch,
+)
+return outputs
+pass
+
+function = inspect.getsource(compute_loss)
return function
pass
RL_FUNCTIONS["sft_trainer"].append(sft_trainer_compute_loss)
Expand Down