Skip to content
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -66,7 +66,7 @@ optional-dependencies.extra = [
# litgpt.pretrain:
"tensorboard>=2.14",
"torchmetrics>=1.3.1",
"transformers>=4.51.3,<4.52",
"transformers>=4.51.3,<4.54",
# litdata, only on non-Windows:
"uvloop>=0.2; sys_platform!='win32'",
# litgpt.data.prepare_slimpajama.py:
Expand Down
2 changes: 1 addition & 1 deletion tests/test_adapter.py
Original file line number Diff line number Diff line change
Expand Up @@ -430,7 +430,7 @@ def test_against_original_gemma_3(model_name, device, dtype):
assert x.size(1) == T
ours_y = ours_model(x)
theirs_y = theirs_model(x)["logits"].to(dtype) # HF converts logits to float
torch.testing.assert_close(ours_y, theirs_y)
torch.testing.assert_close(ours_y, theirs_y, atol=1e-4, rtol=1e-5)


def test_load_legacy_state_dict():
Expand Down
Loading