Upload FIM-ODE fhn training config, logging, etc...

Browse files

Files changed (7) hide show

fhn/gridsearch_01-29-1048/finetuning_report.pdf +0 -0
fhn/gridsearch_01-29-1048/logging/tensorboard/events.out.tfevents.1769683690.ml2ran03.lamarr.tu-dortmund.de.926253.0 +3 -0
fhn/gridsearch_01-29-1048/logging/tensorboard/events.out.tfevents.1769683691.ml2ran03.lamarr.tu-dortmund.de.926253.1 +3 -0
fhn/gridsearch_01-29-1048/logging/train.log +0 -0
fhn/gridsearch_01-29-1048/model_architecture.txt +0 -0
fhn/gridsearch_01-29-1048/task_loss.log +97 -0
fhn/gridsearch_01-29-1048/train_parameters.yaml +110 -0

fhn/gridsearch_01-29-1048/finetuning_report.pdf ADDED Viewed

Binary file (10.7 kB). View file

fhn/gridsearch_01-29-1048/logging/tensorboard/events.out.tfevents.1769683690.ml2ran03.lamarr.tu-dortmund.de.926253.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9d767da5a92fa8a507025bc9e2d0bd3ba611097edf6c51891494f0c323baa6ac
+size 88

fhn/gridsearch_01-29-1048/logging/tensorboard/events.out.tfevents.1769683691.ml2ran03.lamarr.tu-dortmund.de.926253.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4a1a76c8b5f81f07695abcb09236f94edffac1843feaf016bead6b7d8f970a40
+size 271365

fhn/gridsearch_01-29-1048/logging/train.log ADDED Viewed

The diff for this file is too large to render. See raw diff

fhn/gridsearch_01-29-1048/model_architecture.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

fhn/gridsearch_01-29-1048/task_loss.log ADDED Viewed

	@@ -0,0 +1,97 @@

+201: 0.271
+203: 0.071
+205: 0.041
+207: 0.109
+209: 0.126
+211: 0.081
+213: 0.097
+215: 0.040
+217: 0.042
+219: 0.104
+221: 0.053
+223: 0.055
+225: 0.135
+227: 0.148
+229: 0.036
+231: 0.032
+233: 0.052
+235: 0.064
+237: 0.123
+239: 0.057
+241: 0.047
+243: 0.066
+245: 0.054
+247: 0.082
+249: 0.038
+251: 0.049
+253: 0.038
+255: 0.047
+257: 0.036
+259: 0.045
+261: 0.034
+263: 0.041
+265: 0.035
+267: 0.052
+269: 0.041
+271: 0.061
+273: 0.051
+275: 0.062
+277: 0.045
+279: 0.064
+281: 0.053
+283: 0.074
+285: 0.048
+287: 0.090
+289: 0.039
+291: 0.079
+293: 0.064
+295: 0.040
+297: 0.062
+299: 0.048
+301: 0.042
+303: 0.035
+305: 0.088
+307: 0.045
+309: 0.041
+311: 0.076
+313: 0.032
+315: 0.043
+317: 0.108
+319: 0.037
+321: 0.040
+323: 0.087
+325: 0.031
+327: 0.049
+329: 0.082
+331: 0.048
+333: 0.042
+335: 0.037
+337: 0.043
+339: 0.046
+341: 0.030
+343: 0.042
+345: 0.045
+347: 0.075
+349: 0.053
+351: 0.036
+353: 0.041
+355: 0.039
+357: 0.053
+359: 0.043
+361: 0.036
+363: 0.043
+365: 0.036
+367: 0.038
+369: 0.056
+371: 0.032
+373: 0.029
+375: 0.046
+377: 0.039
+379: 0.055
+381: 0.038
+383: 0.050
+385: 0.044
+387: 0.040
+389: 0.030
+391: 0.032
+393: 0.037

fhn/gridsearch_01-29-1048/train_parameters.yaml ADDED Viewed

	@@ -0,0 +1,110 @@

+dataset:
+  batch_size:
+    test: 1
+    train: 1
+    validation: 1
+  data_dirs:
+    test: !!python/tuple []
+    train: !!python/tuple
+    - experiments/odeon/fhn/data_gpode
+    validation: !!python/tuple
+    - experiments/odeon/fhn/data_gpode
+  dataset_name:
+    test: HeterogeneousFIMSDEDataset
+    train: StreamingFIMSDEDataset
+    validation: StreamingFIMSDEDataset
+  files_to_load:
+    locations: locations.h5
+    obs_mask: obs_mask.h5
+    obs_times: obs_times.h5
+    obs_values: obs_values.h5
+  max_dim: 3
+  name: FIMSDEDataloaderIterableDataset
+  num_locations:
+    test: null
+    train: null
+    validation: null
+  num_observations:
+    test: null
+    train: null
+    validation: null
+  num_workers:
+    test: 0
+    train: 1
+    validation: 1
+  shard:
+    test: false
+    train: false
+    validation: false
+  shuffle_elements: true
+  shuffle_locations:
+    test: false
+    train: false
+    validation: false
+  shuffle_paths: true
+distributed:
+  activation_chekpoint: false
+  checkpoint_type: full_state
+  enabled: false
+  min_num_params: 1e5
+  sharding_strategy: NO_SHARD
+  wrap_policy: SIZE_BAZED
+experiment:
+  device_map: auto
+  name: gridsearch
+  name_add_date: true
+  seed: 10
+model:
+  model_config:
+    attention_map: softmax
+    attention_method: linear
+    dim_embed: 256
+    dim_feedforward: 1024
+    dim_ffn_u_model: 1024
+    dim_hidden_u_model: 256
+    dim_max_trajectory: 3
+    dropout: 0.0
+    num_context_encoder_layers: 2
+    num_heads: 8
+    num_res_layer_u_model: 6
+    num_res_layers_functional_decoder: 8
+    use_bias_for_projection: true
+    use_bias_in_attention: true
+    use_query_residual_in_attention: true
+  model_type: TrainingWrapper
+  train_config:
+    corruption_model_type: null
+    h_max: null
+    ic_noise_scale: 0.0
+    integrator_for_trajectory_training: rk4
+    intermediate_steps_per_step: 5
+    loss_filter_nans: true
+    loss_type: l1
+    num_ic: 1
+    only_final_points_for_loss: false
+    step_noise_scale: 0.0
+    train_type: trajectory_reconstruction
+    train_with_normalized_head: true
+    traj_loss_steps: 19
+    use_h_max: false
+optimizers: !!python/tuple
+- optimizer_d:
+    gradient_norm_clipping: 1.0
+    lr: 1.0e-05
+    name: torch.optim.AdamW
+    weight_decay: 0.001
+trainer:
+  best_metric: loss
+  debug_iterations: null
+  detect_anomaly: false
+  epochs: 401
+  experiment_dir: results/fhn
+  gradient_accumulation_steps: 1
+  logging_format: RANK_%(rank)s - %(asctime)s - %(name)s - %(levelname)s - %(message)s
+  name: Trainer
+  precision: bf16mixed
+  save_every: 1
+  schedulers: !!python/tuple
+  - beta: 1.0
+    label: drift_loss_scale
+    name: fim.utils.param_scheduler.ConstantScheduler