Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,7 @@ rslp/crop_type_mapping/csv/
rslp/crop_type_mapping/geoparquets/
rslp/mangrove/csv/
log*.txt
*.egg-info

# for local finetuning runs
/config.yaml
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -1029,7 +1029,7 @@ model:
class_path: rslearn.models.trunk.DecoderTrunk
init_args:
layers:
- class_path: rslearn.models.trunk.MoETransformer
- class_path: rslp.helios.moe.MoETransformer
init_args:
dim: 768
expert_mult: 2
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -1529,14 +1529,13 @@ model:
class_path: rslearn.models.trunk.DecoderTrunk
init_args:
layers:
- class_path: rslearn.models.trunk.MoETransformer
- class_path: rslp.helios.moe.MoETransformer
init_args:
dim: 768
expert_mult: 2
n_heads: 12
n_layers: 2
num_experts: 8
num_slots: 1
n_layers: 1
num_experts: 4
num_slots: 4
task_embedding:
class_path: rslearn.models.task_embedding.TaskChannelEmbedding
init_args:
Expand Down Expand Up @@ -1765,5 +1764,4 @@ trainer:
- 0
unfreeze_at_epoch: 20
unfreeze_lr_factor: 10
limit_val_batches: 1024
max_epochs: 200
Original file line number Diff line number Diff line change
Expand Up @@ -1217,7 +1217,7 @@ model:
class_path: rslearn.models.trunk.DecoderTrunk
init_args:
layers:
- class_path: rslearn.models.trunk.MoETransformer
- class_path: rslp.helios.moe.MoETransformer
init_args:
dim: 768
expert_mult: 2
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ global_overrides:
encoder_embedding_size: 768
add_spatial_embed: true
layers:
- class_path: rslearn.models.trunk.MoETransformer
- class_path: rslp.helios.moe.MoETransformer
init_args:
dim: 768
n_layers: 2
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,16 +31,14 @@ global_overrides:
encoder_embedding_size: 768
add_spatial_embed: true
layers:
- class_path: rslearn.models.trunk.MoETransformer
- class_path: rslp.helios.moe.MoETransformer
init_args:
dim: 768
n_layers: 2
n_layers: 1
n_heads: 12
num_experts: 8
num_slots: 1
expert_mult: 2
num_experts: 4
num_slots: 4
trainer:
limit_val_batches: 1024
accumulate_grad_batches: 5

merge_options:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,7 @@ global_overrides:
encoder_embedding_size: 768
add_spatial_embed: true
layers:
- class_path: rslearn.models.trunk.MoETransformer
- class_path: rslp.helios.moe.MoETransformer
init_args:
dim: 768
n_layers: 2
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,7 @@ global_overrides:
encoder_embedding_size: 768
add_spatial_embed: true
layers:
- class_path: rslearn.models.trunk.MoETransformer
- class_path: rslp.helios.moe.MoETransformer
init_args:
dim: 768
n_layers: 1
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@ global_overrides:
encoder_embedding_size: 768
add_spatial_embed: true
layers:
- class_path: rslearn.models.trunk.MoETransformer
- class_path: rslp.helios.moe.MoETransformer
init_args:
dim: 768
n_layers: 1
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ global_overrides:
encoder_embedding_size: 768
add_spatial_embed: true
layers:
- class_path: rslearn.models.trunk.MoETransformer
- class_path: rslp.helios.moe.MoETransformer
init_args:
dim: 768
n_layers: 1
Expand Down
Loading
Loading