2019-10-03 22:30:36 +08:00
|
|
|
"""
|
|
|
|
This script demonstrates the implementation of the Softmax function.
|
|
|
|
|
|
|
|
Its a function that takes as input a vector of K real numbers, and normalizes
|
|
|
|
it into a probability distribution consisting of K probabilities proportional
|
|
|
|
to the exponentials of the input numbers. After softmax, the elements of the
|
|
|
|
vector always sum up to 1.
|
|
|
|
|
|
|
|
Script inspired from its corresponding Wikipedia article
|
|
|
|
https://en.wikipedia.org/wiki/Softmax_function
|
|
|
|
"""
|
|
|
|
|
|
|
|
import numpy as np
|
|
|
|
|
|
|
|
|
|
|
|
def softmax(vector):
|
|
|
|
"""
|
2020-09-10 16:31:26 +08:00
|
|
|
Implements the softmax function
|
2019-10-03 22:30:36 +08:00
|
|
|
|
2020-09-10 16:31:26 +08:00
|
|
|
Parameters:
|
|
|
|
vector (np.array,list,tuple): A numpy array of shape (1,n)
|
|
|
|
consisting of real values or a similar list,tuple
|
2019-10-03 22:30:36 +08:00
|
|
|
|
|
|
|
|
2020-09-10 16:31:26 +08:00
|
|
|
Returns:
|
|
|
|
softmax_vec (np.array): The input numpy array after applying
|
|
|
|
softmax.
|
2019-10-03 22:30:36 +08:00
|
|
|
|
2020-09-10 16:31:26 +08:00
|
|
|
The softmax vector adds up to one. We need to ceil to mitigate for
|
|
|
|
precision
|
|
|
|
>>> np.ceil(np.sum(softmax([1,2,3,4])))
|
|
|
|
1.0
|
2019-10-03 22:30:36 +08:00
|
|
|
|
2020-09-10 16:31:26 +08:00
|
|
|
>>> vec = np.array([5,5])
|
|
|
|
>>> softmax(vec)
|
|
|
|
array([0.5, 0.5])
|
2019-10-03 22:30:36 +08:00
|
|
|
|
2020-09-10 16:31:26 +08:00
|
|
|
>>> softmax([0])
|
|
|
|
array([1.])
|
2019-10-03 22:30:36 +08:00
|
|
|
"""
|
|
|
|
|
|
|
|
# Calculate e^x for each x in your vector where e is Euler's
|
|
|
|
# number (approximately 2.718)
|
2022-10-13 06:54:20 +08:00
|
|
|
exponent_vector = np.exp(vector)
|
2019-10-03 22:30:36 +08:00
|
|
|
|
|
|
|
# Add up the all the exponentials
|
2022-10-13 06:54:20 +08:00
|
|
|
sum_of_exponents = np.sum(exponent_vector)
|
2019-10-03 22:30:36 +08:00
|
|
|
|
|
|
|
# Divide every exponent by the sum of all exponents
|
2022-10-13 06:54:20 +08:00
|
|
|
softmax_vector = exponent_vector / sum_of_exponents
|
2019-10-03 22:30:36 +08:00
|
|
|
|
|
|
|
return softmax_vector
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
|
|
print(softmax((0,)))
|