Skip to content

Commit cfd288f

Browse files
committed
refactoring
1 parent e44d55e commit cfd288f

File tree

2 files changed

+7
-6
lines changed

2 files changed

+7
-6
lines changed

.gitignore

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,4 @@
1 1   data/nextcoder-synthetic.jsonl
2   - notebook.ipynb
  2 + notebook.ipynb
  3 + git-credential-manager
  4 + models

src/train/selekt.py

Lines changed: 4 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -160,9 +160,9 @@ def selekt(base_path, save_path, alpha, rescaling, rank, trainer):
160 160   non_blocking=True
161 161   )
162 162   delta = param - base_param
163     - print("+"*100)
164     - print(torch.sum(delta))
165     - print("+"*100)
    163 + # print("+"*100)
    164 + # print(torch.sum(delta))
    165 + # print("+"*100)
166 166   mask = torch.zeros_like(delta)
167 167   _, indices = torch.topk(delta.abs().view(-1), int(alpha * delta.numel()))
168 168   mask.view(-1)[indices] = 1
@@ -285,8 +285,7 @@ def train(args):
285 285   gradient_checkpointing_kwargs={"use_reentrant": False},
286 286   deepspeed=args.deepspeed,
287 287   dataset_num_proc=80,
288     - # run_name=args.run_name,
289     - # use_liger=args.use_liger,
    288 + run_name=args.run_name,
290 289   )
291 290
292 291   rank = int(os.environ.get("RANK", "0"))

0 commit comments

Comments
 (0)