Skip to content

Commit d53f328

Browse files
committed
linear callback rank
1 parent e62a995 commit d53f328

File tree

2 files changed

+17
-13
lines changed

2 files changed

+17
-13
lines changed

src/lobster/callbacks/_linear_probe_callback.py

+2
Original file line number | Diff line number | Diff line change
@@ -73,6 +73,8 @@ def _skip(self, trainer: L.Trainer) -> bool:
7373
# Don't skip if global_rank=0 (main process)
7474
if trainer.global_rank == 0:
7575
return False
76+
else:
77+
return True
7678

7779
return trainer.current_epoch % self.run_every_n_epochs != 0
7880

Original file line number | Diff line number | Diff line change
@@ -1,38 +1,42 @@
11
# @package _global_
22

3-
# lobster_train experiment=train_ume logger.entity=zadorozk logger.project=lobster logger.group=ume-dev ++trainer.accelerator=gpu ++trainer.devices=auto
3+
# lobster_train experiment=train_ume ++trainer.devices=auto
44

55
defaults:
66
- override /model: modern_bert.yaml
77
- override /data: ume
8-
- override /callbacks: [base, tokens_per_second, moleculeace_linear_probe_fast, calm_linear_probe_fast]
8+
- override /callbacks: [base, moleculeace_linear_probe_fast, throughput, tokens_per_second]
9+
10+
compile: true
911

1012
data:
1113
_target_: lobster.data.UmeLightningDataModule
1214
root: ${paths.root_dir}/data
1315
datasets: ["M320M", "Calm", "AMPLIFY"]
14-
batch_size: 16
16+
batch_size: 128
1517
tokenizer_max_length: ${model.max_length}
1618
pin_memory: true
17-
shuffle_buffer_size: 10_000
18-
num_workers: 32
19+
shuffle_buffer_size: 1000
20+
num_workers: 8
1921
seed: 0
2022

2123
paths:
22-
root_dir: dev
24+
root_dir: ./runs
2325

2426
trainer:
2527
max_steps: 50_000
26-
val_check_interval: 1_000
28+
val_check_interval: 2000
2729
precision: 16-mixed
2830
gradient_clip_val: 0.5
2931
accumulate_grad_batches: 8
3032
max_time: "00:24:00:00"
31-
33+
limit_val_batches: 20_000
34+
#limit_train_batches: 1000 # for debugging
35+
#profiler: simple
3236

3337
model:
34-
model_name: UME_mini
35-
vocab_size: 627
38+
model_name: UME_medium
39+
vocab_size: 640
3640
pad_token_id: 1
3741
cls_token_id: 0
3842
mask_token_id: 4
@@ -51,10 +55,8 @@ model:
5155
callbacks:
5256
moleculeace_linear_probe:
5357
max_length: ${model.max_length}
54-
calm_linear_probe:
55-
max_length: ${model.max_length}
5658

5759
logger:
5860
name: ume_amplify_m320m_calm_${model.model_name}_${now:%Y-%m-%d_%H-%M-%S}
5961
project: lobster
60-
group: ume-dev
62+
group: ume-dev-${now:%Y-%m-%d-%H-%M-%S}

0 commit comments

Comments
 (0)