pmukhop committed on
Commit
8b1ce6f
·
0 Parent(s):

initial commit rsg

Browse files
Files changed (2) hide show
  1. coalesced.pth +3 -0
  2. extended_config.yaml +250 -0
coalesced.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd0e6b17cdb97b62e41906bcb76e46bd992866238351a203c163a1d5a64e307b
3
+ size 5169595351
extended_config.yaml ADDED
@@ -0,0 +1,250 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data_workers: 10
2
+ name: Walrus_ft_convective_envelope_rsg_realglobalnorm_rusty-rsgon-delta-Isotr[Space-Adapt-Space-FullA-Axial]-AdamW-0.0001
3
+ finetune: true
4
+ automatic_setup: true
5
+ trainer:
6
+ _target_: walrus.trainer.Trainer
7
+ max_epoch: 50
8
+ val_frequency: 5
9
+ rollout_val_frequency: 5
10
+ short_validation_length: 20
11
+ max_rollout_steps: 200
12
+ num_time_intervals: 5
13
+ enable_amp: false
14
+ loss_fn:
15
+ _target_: the_well.benchmark.metrics.MAE
16
+ formatter:
17
+ _target_: hydra.utils.get_class
18
+ path: walrus.data.well_to_multi_transformer.ChannelsFirstWithTimeFormatter
19
+ revin:
20
+ _target_: walrus.trainer.normalization_strat.GlobalRevNormalization
21
+ _partial_: true
22
+ prediction_type: delta
23
+ grad_acc_steps: 1
24
+ image_validation: true
25
+ video_validation: true
26
+ gradient_log_level: 0
27
+ clip_gradient: 10
28
+ log_interval: 200
29
+ loss_multiplier: 100.0
30
+ lr_scheduler_per_step: false
31
+ skip_spectral_metrics: true
32
+ optimizer:
33
+ _target_: torch.optim.AdamW
34
+ lr: 0.0001
35
+ weight_decay: 0.0001
36
+ eps: 1.0e-10
37
+ lr_scheduler:
38
+ _target_: walrus.optim.schedulers.InverseSqrtLinearWarmupSqrtCooldown
39
+ warmup_epochs: 10
40
+ cooldown_epochs: 10
41
+ warmup_lr_factor: 0.1
42
+ cooldown_lr_factor: 0.001
43
+ model:
44
+ encoder:
45
+ _partial_: true
46
+ _target_: walrus.models.encoders.vstride_encoder.SpaceBagAdaptiveDVstrideEncoder
47
+ learned_pad: true
48
+ base_kernel_size1d:
49
+ - - 4
50
+ - 4
51
+ base_kernel_size2d:
52
+ - - 8
53
+ - 4
54
+ - - 8
55
+ - 4
56
+ base_kernel_size3d:
57
+ - - 8
58
+ - 4
59
+ - - 8
60
+ - 4
61
+ - - 8
62
+ - 4
63
+ groups: 12
64
+ kernel_scales_seq:
65
+ - - 2
66
+ - 2
67
+ - - 4
68
+ - 2
69
+ - - 4
70
+ - 4
71
+ - - 8
72
+ - 4
73
+ variable_downsample: true
74
+ variable_deterministic_ds: true
75
+ activation:
76
+ _partial_: true
77
+ _target_: torch.nn.SiLU
78
+ decoder:
79
+ _partial_: true
80
+ _target_: walrus.models.decoders.vstride_decoder.AdaptiveDVstrideDecoder
81
+ learned_pad: true
82
+ base_kernel_size1d:
83
+ - - 4
84
+ - 4
85
+ base_kernel_size2d:
86
+ - - 8
87
+ - 4
88
+ - - 8
89
+ - 4
90
+ base_kernel_size3d:
91
+ - - 8
92
+ - 4
93
+ - - 8
94
+ - 4
95
+ - - 8
96
+ - 4
97
+ groups: 12
98
+ activation:
99
+ _partial_: true
100
+ _target_: torch.nn.SiLU
101
+ processor:
102
+ space_mixing:
103
+ _partial_: true
104
+ _target_: walrus.models.spatial_blocks.full_attention.FullAttention
105
+ num_heads: 16
106
+ mlp_dim: null
107
+ time_mixing:
108
+ _partial_: true
109
+ _target_: walrus.models.temporal_blocks.axial_time_attention.AxialTimeAttention
110
+ num_heads: 16
111
+ bias_type: rel
112
+ channel_mixing:
113
+ _partial_: true
114
+ _target_: torch.nn.Identity
115
+ _partial_: true
116
+ _target_: walrus.models.spatiotemporal_blocks.space_time_split.SpaceTimeSplitBlock
117
+ norm_layer:
118
+ _partial_: true
119
+ _target_: walrus.models.shared_utils.normalization.RMSGroupNorm
120
+ _target_: walrus.models.IsotropicModel
121
+ hidden_dim: 1408
122
+ projection_dim: 48
123
+ intermediate_dim: 352
124
+ processor_blocks: 40
125
+ drop_path: 0.0
126
+ groups: 16
127
+ max_d: 3
128
+ static_axes: true
129
+ weight_tied_axes: false
130
+ causal_in_time: true
131
+ include_d:
132
+ - 2
133
+ - 3
134
+ override_dimensionality: 0
135
+ jitter_patches: true
136
+ gradient_checkpointing_freq: 2
137
+ use_periodic_fixed_jitter: true
138
+ input_field_drop: 0
139
+ data:
140
+ field_index_map_override:
141
+ closed_boundary: 0
142
+ open_boundary: 1
143
+ bias_correction: 2
144
+ pressure: 3
145
+ velocity_x: 4
146
+ velocity_y: 5
147
+ velocity_z: 6
148
+ zeros_like_density: 7
149
+ speed_of_sound: 8
150
+ concentration: 9
151
+ D_xx: 10
152
+ D_xy: 11
153
+ D_xz: 12
154
+ D_yx: 13
155
+ D_yy: 14
156
+ D_yz: 15
157
+ D_zx: 16
158
+ D_zy: 17
159
+ D_zz: 18
160
+ E_xx: 19
161
+ E_xy: 20
162
+ E_xz: 21
163
+ E_yx: 22
164
+ E_yy: 23
165
+ E_yz: 24
166
+ E_zx: 25
167
+ E_zy: 26
168
+ E_zz: 27
169
+ density: 28
170
+ energy: 29
171
+ velocity_r: 30
172
+ velocity_theta: 31
173
+ velocity_phi: 32
174
+ momentum_x: 33
175
+ momentum_y: 34
176
+ momentum_z: 35
177
+ pressure_re: 36
178
+ pressure_im: 37
179
+ mask: 38
180
+ magnetic_field_x: 39
181
+ magnetic_field_y: 40
182
+ magnetic_field_z: 41
183
+ A: 42
184
+ B: 43
185
+ height: 44
186
+ internal_energy: 45
187
+ temperature: 46
188
+ electron_fraction: 47
189
+ entropy: 48
190
+ magnetic_field_log_r: 49
191
+ magnetic_field_theta: 50
192
+ magnetic_field_phi: 51
193
+ velocity_log_r: 52
194
+ buoyancy: 53
195
+ tracer: 54
196
+ log10_density: 55
197
+ log10_temperature: 56
198
+ c_zz: 57
199
+ C_xx: 58
200
+ C_xy: 59
201
+ C_xz: 60
202
+ C_yx: 61
203
+ C_yy: 62
204
+ C_yz: 63
205
+ C_zx: 64
206
+ C_zy: 65
207
+ C_zz: 66
208
+ well_base_path: /mnt/home/polymathic/ceph/the_well/datasets/
209
+ wandb_data_name: rsgonly
210
+ module_parameters:
211
+ _target_: data.MixedWellDataModule
212
+ batch_size: 1
213
+ n_steps_input: 3
214
+ n_steps_output: 1
215
+ min_dt_stride: 5
216
+ max_dt_stride: 5
217
+ max_samples: 2000
218
+ well_dataset_info:
219
+ convective_envelope_rsg:
220
+ include_filters: []
221
+ exclude_filters: []
222
+ normalization_path: logged_stats_stride_5.yaml
223
+ auto_resume: true
224
+ folder_override: ''
225
+ checkpoint_override: ''
226
+ config_override: /mnt/home/polymathic/ceph/walrus_logging/platinum_checkpoints/extended_config.yaml
227
+ validation_mode: false
228
+ frozen_components:
229
+ - model
230
+ distribution:
231
+ distribution_type: fsdp
232
+ local_size: null
233
+ logger:
234
+ wandb: true
235
+ wandb_project_name: walrus_Finetuning_Runs
236
+ checkpoint:
237
+ _target_: walrus.trainer.checkpoints.CheckPointer
238
+ save_dir: /mnt/home/polymathic/ceph/walrus_logging/runs/Walrus_ft_convective_envelope_rsg_realglobalnorm_rusty-rsgon-delta-Isotr[Space-Adapt-Space-FullA-Axial]-AdamW-0.0001/finetune/0/checkpoints
239
+ load_checkpoint_path: null
240
+ coalesced_checkpoint_path: /mnt/home/polymathic/ceph/walrus_logging/platinum_checkpoints/final_base_model/walrus.pt
241
+ save_best: true
242
+ checkpoint_frequency: 20
243
+ finetuning_mods:
244
+ learnable_rope: true
245
+ rope_per_axis: true
246
+ ape_shape:
247
+ - 17
248
+ - 16
249
+ - 16
250
+ experiment_dir: /mnt/home/polymathic/ceph/walrus_logging/runs