Skip to content

Commit

Permalink
Change init scale: reduce NormalInitializer stddev from 3e-1 to 1e-1
Browse files (browse the repository at this point in the history)
  • Loading branch information
loreloc committed Jul 18, 2024
1 parent 1b104af commit 1324738
Show file tree
Hide file tree
Showing 2 changed files with 11 additions and 7 deletions.
6 changes: 5 additions & 1 deletion src/layers.py
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,11 @@ def __init__(
assert weight1.num_folds == num_folds
assert weight2.num_folds == num_folds
super().__init__(
num_input_units, num_output_units, arity=1, num_folds=num_folds, semiring=semiring
num_input_units,
num_output_units,
arity=1,
num_folds=num_folds,
semiring=semiring,
)
self._in_shape = (weight1.shape[1], weight2.shape[1])
self.weight1 = weight1
Expand Down
12 changes: 6 additions & 6 deletions src/models.py
Original file line number Diff line number Diff line change
Expand Up @@ -184,7 +184,7 @@ def __init__(
backend="torch", semiring="complex-lse-sum", fold=True, optimize=True
)
# Use a different optimization rule for the dense-kronecker pattern
self._pipeline._compiler._optimization_registry['layer_shatter'].add_rule(
self._pipeline._compiler._optimization_registry["layer_shatter"].add_rule(
apply_dense_product, signature=DenseKroneckerPattern
)
self._circuit, self._int_sq_circuit = self._build_circuits(
Expand Down Expand Up @@ -332,7 +332,7 @@ def categorical_layer_factory(
num_channels,
num_categories=input_layer_kwargs["num_categories"],
logits_factory=lambda shape: Parameter.from_leaf(
TensorParameter(*shape, initializer=NormalInitializer(0.0, 3e-1))
TensorParameter(*shape, initializer=NormalInitializer(0.0, 1e-1))
),
)

Expand All @@ -347,7 +347,7 @@ def gaussian_layer_factory(
TensorParameter(*shape, initializer=NormalInitializer(0.0, 1.0))
),
stddev_factory=lambda shape: Parameter.from_sequence(
TensorParameter(*shape, initializer=NormalInitializer(0.0, 3e-1)),
TensorParameter(*shape, initializer=NormalInitializer(0.0, 1e-1)),
ExpParameter(shape),
ClampParameter(shape, vmin=1e-5),
),
Expand All @@ -367,7 +367,7 @@ def dense_layer_factory(
num_output_units,
weight_factory=lambda shape: Parameter.from_unary(
ExpParameter(shape),
TensorParameter(*shape, initializer=NormalInitializer(0.0, 3e-1)),
TensorParameter(*shape, initializer=NormalInitializer(0.0, 1e-1)),
),
)

Expand Down Expand Up @@ -413,7 +413,7 @@ def categorical_layer_factory(
num_channels,
num_categories=input_layer_kwargs["num_categories"],
logits_factory=lambda shape: Parameter.from_leaf(
TensorParameter(*shape, initializer=NormalInitializer(0.0, 3e-1))
TensorParameter(*shape, initializer=NormalInitializer(0.0, 1e-1))
),
)

Expand All @@ -428,7 +428,7 @@ def gaussian_layer_factory(
TensorParameter(*shape, initializer=NormalInitializer(0.0, 1.0))
),
stddev_factory=lambda shape: Parameter.from_sequence(
TensorParameter(*shape, initializer=NormalInitializer(0.0, 3e-1)),
TensorParameter(*shape, initializer=NormalInitializer(0.0, 1e-1)),
ExpParameter(shape),
ClampParameter(shape, vmin=1e-5),
),
Expand Down

0 comments on commit 1324738

Please sign in to comment.