diff --git a/keras/src/layers/core/dense.py b/keras/src/layers/core/dense.py index 56c86f50cbf6..8af0120c5101 100644 --- a/keras/src/layers/core/dense.py +++ b/keras/src/layers/core/dense.py @@ -23,7 +23,9 @@ class Dense(Layer): where `activation` is the element-wise activation function passed as the `activation` argument, `kernel` is a weights matrix created by the layer, and `bias` is a bias vector created by the layer - (only applicable if `use_bias` is `True`). + (only applicable if `use_bias` is `True`). When this layer is + followed by a `BatchNormalization` layer, it is recommended to set + `use_bias=False` as `BatchNormalization` has its own bias term. Note: If the input to the layer has a rank greater than 2, `Dense` computes the dot product between the `inputs` and the `kernel` along the