Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion init2winit/dataset_lib/pg19.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@

This module implements a preprocessed PG-19 dataset from TFRecords. The PG-19
textfiles were tokenized and encoded with SubwordTextEncoder and aggregated into
- tensors of maximum lenght of 8192.
+ tensors of maximum length of 8192.
"""

import functools
Expand Down
2 changes: 1 addition & 1 deletion init2winit/model_lib/adabelief_densenet.py
Original file line number Diff line number Diff line change
Expand Up @@ -120,7 +120,7 @@ def __call__(self, x, train):
class DenseNet(nn.Module):
"""Adabelief DenseNet.

- The network consists of an inital convolutaional layer, four dense blocks
+ The network consists of an initial convolutional layer, four dense blocks
connected by transition blocks, a pooling layer and a classification layer.
"""
num_layers: int
Expand Down
2 changes: 1 addition & 1 deletion init2winit/model_lib/base_model.py
Original file line number Diff line number Diff line change
Expand Up @@ -308,7 +308,7 @@ def _apply_override(sharding, param_type, param_shape):
return overriden_shardings

def get_sharding(self, params, mesh):
- """Returns the overriden sharding annotations for the model.
+ """Returns the overridden sharding annotations for the model.

The default sharding strategy is to replicate all layers on all devices.
Models can override get_sharding_overrides() to specify sharding overrides
Expand Down
2 changes: 1 addition & 1 deletion init2winit/optimizer_lib/kitchen_sink/_src/transform.py
Original file line number Diff line number Diff line change
Expand Up @@ -1898,7 +1898,7 @@ def update_fn(updates, state, params):
return optax.GradientTransformation(init_fn, update_fn)


- # scale_by_rms exists only for backward compatability
+ # scale_by_rms exists only for backward compatibility
_composites = {
'scale_by_adaptive_gd': scale_by_adaptive_gd,
'scale_by_adaptive_gd_simple': scale_by_adaptive_gd_simple,
Expand Down
2 changes: 1 addition & 1 deletion init2winit/optimizer_lib/samuel.py
Original file line number Diff line number Diff line change
Expand Up @@ -64,7 +64,7 @@ def samuel(
mw_etas: list of multiplicative weight etas.
seed: initial jax random seed.
train_loss: train loss to be injected at update time.
- learning_rate: for compatability, but ignored for now.
+ learning_rate: for compatibility, but ignored for now.

Returns:
samuel optimizer
Expand Down
2 changes: 1 addition & 1 deletion init2winit/optimizer_lib/search_subspace.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@

"""Algorithms for narrowing hyperparameter search spaces.

- TODO(dsuo): suport discrete hparams.
+ TODO(dsuo): support discrete hparams.
"""
import copy
import itertools
Expand Down
2 changes: 1 addition & 1 deletion init2winit/schedules.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
def _check_schedule_hparams(schedule_hparams, expected_keys):
if set(schedule_hparams.keys()) != set(expected_keys):
raise ValueError(
- 'Provided schedule_hparams keys are invalid. Recieved: {}, Expected: {}'
+ 'Provided schedule_hparams keys are invalid. Received: {}, Expected: {}'
.format(sorted(schedule_hparams.keys()), sorted(expected_keys))
)

Expand Down