733 lines
14 KiB
YAML
733 lines
14 KiB
YAML
name: EXAMPLE
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # Input size for the Feature Extractor (length of snippets). (=0.1s)
|
|
transforms:
|
|
- type: 'identity' # Pass the last n samples of the input data directly.
|
|
length: 8 # Number of last samples to pass directly. Use full input size if set to null.
|
|
- type: 'fourier' # Apply Fourier transform to the input data.
|
|
length: null # Use full input size if set to null. Fourier transform outputs both real and imaginary parts, doubling the size. (Computationally expensive)
|
|
- type: 'wavelet' # (Pro Tip: Discrete Meyer are great for recognizing spikes)
|
|
wavelet_type: 'dmey' # Discrete Meyer wavelets offer good frequency localization, ideal for signals with oscillatory components.
|
|
length: null # Use full input size if set to null. (Computationally expensive)
|
|
- type: 'wavelet'
|
|
wavelet_type: 'db1' # Daubechies wavelets provide a balance between time and frequency localization.
|
|
length: null # Use full input size if set to null. (Computationally expensive)
|
|
- type: 'wavelet'
|
|
wavelet_type: 'sym2' # Symlet wavelets are nearly symmetrical, offering improved phase characteristics over Daubechies.
|
|
length: null # Use full input size if set to null. (Computationally expensive)
|
|
- type: 'wavelet'
|
|
wavelet_type: 'coif1' # Coiflet wavelets have more vanishing moments, suitable for capturing polynomial trends.
|
|
length: null # Use full input size if set to null. (Computationally expensive)
|
|
- type: 'wavelet'
|
|
wavelet_type: 'bior1.3' # Biorthogonal wavelets provide perfect reconstruction and linear phase characteristics.
|
|
length: null # Use full input size if set to null. (Computationally expensive)
|
|
- type: 'wavelet'
|
|
wavelet_type: 'rbio1.3' # Reverse Biorthogonal wavelets are similar to Biorthogonal but optimized for different applications.
|
|
length: null # Use full input size if set to null. (Computationally expensive)
|
|
- type: 'wavelet'
|
|
wavelet_type: 'haar' # Haar wavelet is simple and fast, but may not capture detailed features well.
|
|
length: null # Use full input size if set to null.
|
|
- type: 'wavelet'
|
|
wavelet_type: 'cgau1' # Complex Gaussian wavelets are used for complex-valued signal analysis and capturing phase information.
|
|
length: null # Use full input size if set to null.
|
|
|
|
latent_projector:
|
|
type: 'fc' # Type of latent projector: 'fc', 'rnn' (Recommended: fc)
|
|
latent_size: 4 # Size of the latent representation before message passing.
|
|
layer_shapes: [32, 8] # List of layer sizes for the latent projector if type is 'fc' or 'fourier'.
|
|
activations: ['ReLU', 'ReLU'] # Activation functions for the latent projector layers if type is 'fc' or 'fourier'.
|
|
rnn_hidden_size: 4 # Hidden size for the RNN projector if type is 'rnn'.
|
|
rnn_num_layers: 1 # Number of layers for the RNN projector if type is 'rnn'.
|
|
|
|
middle_out:
|
|
region_latent_size: 4 # Size of the latent representation after message passing.
|
|
residual: false # Wether to use a ResNet style setup. Requires region_latent_size = latent_size
|
|
num_peers: 3 # Number of closest peers to consider.
|
|
|
|
predictor:
|
|
layer_shapes: [3] # List of layer sizes for the predictor.
|
|
activations: ['ReLU'] # Activation functions for the predictor layers.
|
|
|
|
training:
|
|
epochs: 1024 # Number of training epochs.
|
|
batch_size: 32 # Batch size for training.
|
|
num_batches: 1 # Number of batches per epoch.
|
|
learning_rate: 0.01 # Learning rate for the optimizer.
|
|
peer_gradients_factor: 0.33 # Factor for gradients acting on predictor throught peers. 0.0 = detach gradients.
|
|
value_scale: 1 # Normalize data by dividing values by this (and multiple outputs)
|
|
eval_freq: 8 # Frequency of evaluation during training (in epochs).
|
|
save_path: models # Directory to save the best model and encoder.
|
|
|
|
evaluation:
|
|
full_compression: false # Perform full compression during evaluation.
|
|
|
|
bitstream_encoding:
|
|
type: rice # Bitstream encoding type: 'identity', 'rice', 'binomHuffman', 'bzip2', 'arithmetic' (Recommended: rice)
|
|
k: 2 # k value if type is 'rice'
|
|
|
|
data:
|
|
url: https://content.neuralink.com/compression-challenge/data.zip # URL to download the dataset.
|
|
directory: data # Directory to extract and store the dataset.
|
|
split_ratio: 0.8 # Ratio to split the data into train and test sets.
|
|
cut_length: null # Optional length to cut sequences to.
|
|
|
|
profiler:
|
|
enable: false # Enable profiler.
|
|
|
|
---
|
|
|
|
name: DEFAULT
|
|
project: Spikey_3
|
|
|
|
slurm:
|
|
name: 'Spikey_{config[name]}'
|
|
partitions:
|
|
- single
|
|
standard_output: ./reports/slurm/out_%A_%a.log
|
|
standard_error: ./reports/slurm/err_%A_%a.log
|
|
num_parallel_jobs: 50
|
|
cpus_per_task: 8
|
|
memory_per_cpu: 4000
|
|
time_limit: 1440 # in minutes
|
|
ntasks: 1
|
|
venv: '.venv/bin/activate'
|
|
sh_lines:
|
|
- 'mkdir -p {tmp}/wandb'
|
|
- 'mkdir -p {tmp}/local_pycache'
|
|
- 'export PYTHONPYCACHEPREFIX={tmp}/local_pycache'
|
|
|
|
runner: spikey
|
|
|
|
scheduler:
|
|
reps_per_version: 1
|
|
agents_per_job: 8
|
|
reps_per_agent: 1
|
|
|
|
wandb:
|
|
project: '{config[project]}'
|
|
group: '{config[name]}'
|
|
job_type: '{delta_desc}'
|
|
name: '{job_id}_{task_id}:{run_id}:{rand}={config[name]}_{delta_desc}'
|
|
#tags:
|
|
# - '{config[env][name]}'
|
|
# - '{config[algo][name]}'
|
|
sync_tensorboard: false
|
|
monitor_gym: false
|
|
save_code: false
|
|
|
|
evaluation:
|
|
full_compression: false
|
|
|
|
bitstream_encoding:
|
|
type: binomHuffman
|
|
|
|
data:
|
|
url: https://content.neuralink.com/compression-challenge/data.zip
|
|
directory: data
|
|
split_ratio: 0.8
|
|
cut_length: null
|
|
|
|
profiler:
|
|
enable: false
|
|
|
|
training:
|
|
eval_freq: 8
|
|
save_path: models
|
|
peer_gradients_factor: 0.25
|
|
value_scale: 1
|
|
device: cpu
|
|
|
|
middle_out:
|
|
residual: false
|
|
---
|
|
name: FC_smol_master6
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 195
|
|
transforms:
|
|
- type: 'identity' # Pass the last n samples of the input data directly.
|
|
|
|
scheduler:
|
|
reps_per_version: 8
|
|
agents_per_job: 8
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 6
|
|
layer_shapes: [20, 6]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 6
|
|
num_peers: 3
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [3]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
eval_freq: 16
|
|
---
|
|
name: Smol_Feat_fourier
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: fourier
|
|
#- type: 'wavelet'
|
|
# wavelet_type: 'haar' # 'db1' # 'sym2', 'coif1', 'bior1.3', 'rbio1.3', 'dmey', 'morl', 'haar', 'cgau1'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 1
|
|
agents_per_job: 1
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 4
|
|
layer_shapes: [20, 6]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 4
|
|
num_peers: 2
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [2]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
---
|
|
name: Smol_Feat_db1_1
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'db1' # 'sym2', 'coif1', 'bior1.3', 'rbio1.3', 'dmey', 'morl', 'haar', 'cgau1'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 1
|
|
agents_per_job: 1
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 4
|
|
layer_shapes: [20, 6]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 4
|
|
num_peers: 2
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [2]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
---
|
|
name: Smol_Feat_sym2_1
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'sym2'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 1
|
|
agents_per_job: 1
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 4
|
|
layer_shapes: [20, 6]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 4
|
|
num_peers: 2
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [2]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
---
|
|
name: Smol_Feat_coif1_1
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'coif1'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 1
|
|
agents_per_job: 1
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 4
|
|
layer_shapes: [20, 6]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 4
|
|
num_peers: 2
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [2]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
---
|
|
name: Smol_Feat_haar_1
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'haar'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 1
|
|
agents_per_job: 1
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 4
|
|
layer_shapes: [20, 6]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 4
|
|
num_peers: 2
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [2]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
---
|
|
name: Smol_Feat_dmey_1
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'dmey'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 1
|
|
agents_per_job: 1
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 4
|
|
layer_shapes: [20, 6]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 4
|
|
num_peers: 2
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [2]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
---
|
|
name: Proto_1
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'dmey'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 8
|
|
agents_per_job: 8
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 8
|
|
layer_shapes: [24, 12]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 8
|
|
num_peers: 3
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [4]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
|
|
evaluation:
|
|
full_compression: true
|
|
---
|
|
name: Proto_2
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'dmey'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 4
|
|
agents_per_job: 4
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 8
|
|
layer_shapes: [24, 12]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 8
|
|
num_peers: 3
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [4]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
|
|
bitstream_encoding:
|
|
type: rice
|
|
|
|
evaluation:
|
|
full_compression: true
|
|
---
|
|
name: Proto_Light_0
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 8
|
|
agents_per_job: 8
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 8
|
|
layer_shapes: [24, 12]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 8
|
|
num_peers: 3
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [4]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
---
|
|
name: Proto_3_Light_SmolInp
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: identity
|
|
length: 19
|
|
|
|
scheduler:
|
|
reps_per_version: 2
|
|
agents_per_job: 2
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 8
|
|
layer_shapes: [24, 12]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 8
|
|
num_peers: 3
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [4]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
|
|
bitstream_encoding:
|
|
type: rice
|
|
|
|
evaluation:
|
|
full_compression: true
|
|
---
|
|
name: Proto_3_Light_HugeInp
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: identity
|
|
length: 1953
|
|
|
|
scheduler:
|
|
reps_per_version: 2
|
|
agents_per_job: 2
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 8
|
|
layer_shapes: [24, 12]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 8
|
|
num_peers: 3
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [4]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
|
|
bitstream_encoding:
|
|
type: rice
|
|
k: 2
|
|
|
|
evaluation:
|
|
full_compression: true
|
|
---
|
|
name: Proto_3_Smol
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 195 # (=0.01s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'dmey'
|
|
- type: identity
|
|
length: 19
|
|
|
|
scheduler:
|
|
reps_per_version: 2
|
|
agents_per_job: 2
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 8
|
|
layer_shapes: [24, 12]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 8
|
|
num_peers: 3
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [4]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
|
|
bitstream_encoding:
|
|
type: rice
|
|
k: 2
|
|
|
|
evaluation:
|
|
full_compression: true
|
|
---
|
|
name: Proto_2_k2
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'dmey'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 2
|
|
agents_per_job: 2
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 8
|
|
layer_shapes: [24, 12]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 8
|
|
num_peers: 3
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [4]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
|
|
bitstream_encoding:
|
|
type: rice
|
|
k: 2
|
|
|
|
evaluation:
|
|
full_compression: true
|
|
---
|
|
name: Proto_2_k4
|
|
import: $
|
|
|
|
feature_extractor:
|
|
input_size: 1953 # (=0.1s)
|
|
transforms:
|
|
- type: 'wavelet'
|
|
wavelet_type: 'dmey'
|
|
- type: identity
|
|
length: 195
|
|
|
|
scheduler:
|
|
reps_per_version: 2
|
|
agents_per_job: 2
|
|
|
|
latent_projector:
|
|
type: fc
|
|
latent_size: 8
|
|
layer_shapes: [24, 12]
|
|
activations: ['ReLU', 'ReLU']
|
|
|
|
middle_out:
|
|
region_latent_size: 8
|
|
num_peers: 3
|
|
residual: true
|
|
|
|
predictor:
|
|
layer_shapes: [4]
|
|
activations: ['ReLU']
|
|
|
|
training:
|
|
epochs: 10000
|
|
batch_size: 32
|
|
num_batches: 1
|
|
learning_rate: 0.01
|
|
device: cpu
|
|
|
|
bitstream_encoding:
|
|
type: rice
|
|
k: 4
|
|
|
|
evaluation:
|
|
full_compression: true |