2022-10-28 22:27:16 +08:00
|
|
|
"""
|
|
|
|
This script demonstrates the implementation of the Sigmoid Linear Unit (SiLU)
|
|
|
|
or swish function.
|
|
|
|
* https://en.wikipedia.org/wiki/Rectifier_(neural_networks)
|
|
|
|
* https://en.wikipedia.org/wiki/Swish_function
|
|
|
|
|
|
|
|
The function takes a vector x of K real numbers as input and returns x * sigmoid(x).
|
|
|
|
Swish is a smooth, non-monotonic function defined as f(x) = x * sigmoid(x).
|
|
|
|
Extensive experiments show that Swish consistently matches or outperforms ReLU
|
|
|
|
on deep networks applied to a variety of challenging domains such as
|
|
|
|
image classification and machine translation.
|
|
|
|
|
|
|
|
This script is inspired by a corresponding research paper.
|
|
|
|
* https://arxiv.org/abs/1710.05941
|
|
|
|
"""
|
|
|
|
|
|
|
|
import numpy as np
|
|
|
|
|
|
|
|
|
2023-06-22 20:24:34 +08:00
|
|
|
def sigmoid(vector: np.ndarray) -> np.ndarray:
    """
    Apply the logistic sigmoid 1 / (1 + e^-x) element-wise.

    https://en.wikipedia.org/wiki/Sigmoid_function

    The result is evaluated as exp(-log(1 + e^-x)) using ``np.logaddexp``, so
    the intermediate e^-x term is never formed directly. The naive form
    overflows in ``np.exp`` (and emits a RuntimeWarning) for large-magnitude
    negative inputs; this form returns the same values without the overflow.

    Parameters:
        vector (np.ndarray): A numpy array consisting of real values

    Returns:
        np.ndarray: The element-wise sigmoid of the input, same shape as input

    Examples:
    >>> sigmoid(np.array([-1.0, 1.0, 2.0]))
    array([0.26894142, 0.73105858, 0.88079708])

    >>> float(sigmoid(np.array([-1000.0]))[0])
    0.0
    """
    # log(1 + e^-x) == logaddexp(0, -x); negating and exponentiating yields
    # 1 / (1 + e^-x) without an overflowing intermediate.
    return np.exp(-np.logaddexp(0.0, -vector))
|
|
|
|
|
|
|
|
|
2023-06-22 20:24:34 +08:00
|
|
|
def sigmoid_linear_unit(vector: np.ndarray) -> np.ndarray:
    """
    Apply the Sigmoid Linear Unit (SiLU), also known as swish, element-wise.

    Every element x of the input is mapped to x * sigmoid(x).

    Parameters:
        vector (np.ndarray): A numpy array consisting of real values

    Returns:
        swish_vec (np.ndarray): The input numpy array, after applying swish

    Examples:
    >>> sigmoid_linear_unit(np.array([-1.0, 1.0, 2.0]))
    array([-0.26894142,  0.73105858,  1.76159416])

    >>> sigmoid_linear_unit(np.array([-2]))
    array([-0.23840584])
    """
    # The sigmoid acts as a smooth gate that scales each input element.
    gate = sigmoid(vector)
    swish_vec = vector * gate
    return swish_vec
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
    # When executed as a script, run the examples embedded in the docstrings.
    from doctest import testmod

    testmod()
|