-
Notifications
You must be signed in to change notification settings - Fork 31
Expand file tree
/
Copy pathmnist_autoencoder.py
More file actions
102 lines (81 loc) · 2.45 KB
/
Copy pathmnist_autoencoder.py
File metadata and controls
102 lines (81 loc) · 2.45 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
# Copyright 2026 The kauldron Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
r"""Minimal example training a simple Autoencoder on MNIST.
Run:
```sh
python -m kauldron.main \
--cfg=examples/mnist_autoencoder.py \
--cfg.workdir=/tmp/kauldron_oss/workdir
```
"""
from kauldron import konfig
# pylint: disable=g-import-not-at-top
with konfig.imports():
from flax import linen as nn
from kauldron import kd
import optax
# pylint: enable=g-import-not-at-top
def get_config():
"""Get the default hyperparameter configuration."""
cfg = kd.train.Trainer()
cfg.seed = 42
# Dataset
cfg.train_ds = _make_ds(training=True)
# Model
cfg.model = kd.nn.FlatAutoencoder(
inputs="batch.image",
encoder=nn.Dense(features=128),
decoder=nn.Dense(features=28 * 28),
)
# Training
cfg.num_train_steps = 1000
# Losses
cfg.train_losses = {
"recon": kd.losses.L2(preds="preds.image", targets="batch.image"),
}
cfg.train_metrics = {
"latent_norm": kd.metrics.Norm(tensor="interms.encoder.__call__[0]"),
}
cfg.train_summaries = {
"gt": kd.summaries.ShowImages(images="batch.image", num_images=5),
"recon": kd.summaries.ShowImages(images="preds.image", num_images=5),
}
# Optimizer
cfg.schedules = {}
cfg.optimizer = optax.adam(learning_rate=0.003)
# Checkpointer
cfg.checkpointer = kd.ckpts.Checkpointer(
save_interval_steps=500,
)
cfg.evals = {
"eval": kd.evals.Evaluator(
run=kd.evals.EveryNSteps(100),
num_batches=None,
ds=_make_ds(training=False),
metrics={},
)
}
return cfg
def _make_ds(training: bool):
return kd.data.py.Tfds(
name="mnist",
split="train" if training else "test",
shuffle=True if training else False,
num_epochs=None if training else 1,
transforms=[
kd.data.Elements(keep=["image"]),
kd.data.ValueRange(key="image", vrange=(0, 1)),
],
batch_size=256,
)