Hidden State Activation: Ungraded Lecture Notebook¶

In this notebook you'll take another look at the hidden state activation function. It can be written in two different ways.

You will see, step by step, how to implement each of them and then how to verify whether the results produced by each of them are the same.

Background¶

(Figure: a vanilla RNN)

Here you can see an image of a recurrent neural network (RNN). The hidden state activation function for a vanilla RNN can be written as an equation in two ways. You can either write it like this:

$h^{<t>}=g(W_{h}[h^{<t-1>},x^{<t>}] + b_h)$

Or you can write it like this:

$h^{<t>}=g(W_{hh}h^{<t-1>} + W_{hx}x^{<t>} + b_h)$

The difference between the formulas is that in the first case you concatenate the matrices together and perform the multiplication only once, while in the second case you perform two separate multiplications and then sum them. More specifically:

  • $W_{h}$ in the first formula denotes the horizontal concatenation of weight matrices $W_{hh}$ and $W_{hx}$ from the second formula.

  • $W_{h}$ in the first formula is then multiplied by $[h^{<t-1>}, x^{<t>}]$, another concatenation of parameters from the second formula, but this time in a different direction, i.e. vertical! In the second formula, each of the two (non-concatenated) weight matrices is multiplied by its own respective vector, as the identity below makes explicit.
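
Putting the two bullets together, the equivalence of the formulas is just the block-matrix identity:

$W_{h}[h^{<t-1>},x^{<t>}] = \left [ W_{hh} \ | \ W_{hx} \right ]\left[ \frac{h^{<t-1>}}{x^{<t>}} \right] = W_{hh}h^{<t-1>} + W_{hx}x^{<t>}$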

Below, you will calculate both options using NumPy.

Imports¶

In [1]:
import numpy as np

Joining (Concatenation)¶

Weights¶

A join along the vertical boundary is called a horizontal concatenation or horizontal stack.

Visually, it looks like this: $W_h = \left [ W_{hh} \ | \ W_{hx} \right ]$

You will see two different ways to achieve this using NumPy.

Note: The values used to populate the arrays below have been chosen for visual illustration only. They are NOT what you'd use when building a real model, where the weights would typically be initialized with random values instead.

  • Try using random initializations for the weight arrays.
In [5]:
# Create some dummy data

w_hh = np.full((3, 2), 1)  # illustration purposes only, returns an array of size 3x2 filled with all 1s
w_hx = np.full((3, 3), 9)  # illustration purposes only, returns an array of size 3x3 filled with all 9s


### START CODE HERE ###
# Random initializations are used here, though they obfuscate the join
# (comment out these lines to keep the illustrative values above)
w_hh = np.random.standard_normal((3,2))
w_hx = np.random.standard_normal((3,3))
### END CODE HERE ###

print("-- Data --\n")
print("w_hh :")
print(w_hh)
print("w_hh shape :", w_hh.shape, "\n")
print("w_hx :")
print(w_hx)
print("w_hx shape :", w_hx.shape, "\n")

# Joining the arrays
print("-- Joining --\n")
# Option 1: concatenate - horizontal
w_h1 = np.concatenate((w_hh, w_hx), axis=1)
print("option 1 : concatenate\n")
print("w_h :")
print(w_h1)
print("w_h shape :", w_h1.shape, "\n")

# Option 2: hstack
w_h2 = np.hstack((w_hh, w_hx))
print("option 2 : hstack\n")
print("w_h :")
print(w_h2)
print("w_h shape :", w_h2.shape)
-- Data --

w_hh :
[[ 0.25241063 -0.58719331]
 [ 0.76074054  0.41083323]
 [ 1.39920087  0.25120103]]
w_hh shape : (3, 2) 

w_hx :
[[-0.75737614 -0.31967698  3.92355764]
 [ 1.7822747  -0.34623084  0.95240106]
 [ 1.00016719  1.17633294 -0.16451155]]
w_hx shape : (3, 3) 

-- Joining --

option 1 : concatenate

w_h :
[[ 0.25241063 -0.58719331 -0.75737614 -0.31967698  3.92355764]
 [ 0.76074054  0.41083323  1.7822747  -0.34623084  0.95240106]
 [ 1.39920087  0.25120103  1.00016719  1.17633294 -0.16451155]]
w_h shape : (3, 5) 

option 2 : hstack

w_h :
[[ 0.25241063 -0.58719331 -0.75737614 -0.31967698  3.92355764]
 [ 0.76074054  0.41083323  1.7822747  -0.34623084  0.95240106]
 [ 1.39920087  0.25120103  1.00016719  1.17633294 -0.16451155]]
w_h shape : (3, 5)
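
Both options produce the same array. As a quick optional sanity check (not part of the original cell), you can confirm this by reusing w_h1 and w_h2 from the cell above:

In [ ]:
# Optional sanity check: both joining options should produce identical arrays
print("concatenate and hstack agree :", np.allclose(w_h1, w_h2))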

Hidden State & Inputs¶

Joining along a horizontal boundary is called a vertical concatenation or vertical stack. Visually it looks like this:

$[h^{<t-1>},x^{<t>}] = \left[ \frac{h^{<t-1>}}{x^{<t>}} \right]$

You will see two different ways to achieve this using NumPy.

Try using random initializations for the hidden state and input matrices.

In [9]:
# Create some more dummy data
h_t_prev = np.full((2, 1), 1)  # illustration purposes only, returns an array of size 2x1 filled with all 1s
x_t = np.full((3, 1), 9)       # illustration purposes only, returns an array of size 3x1 filled with all 9s

# Random initializations are used below, though they obfuscate the join
# (comment out the lines between START/END CODE HERE to keep the illustrative values above)

### START CODE HERE ###
h_t_prev = np.random.standard_normal((2,1))
x_t = np.random.standard_normal((3,1))
### END CODE HERE ###

print("-- Data --\n")
print("h_t_prev :")
print(h_t_prev)
print("h_t_prev shape :", h_t_prev.shape, "\n")
print("x_t :")
print(x_t)
print("x_t shape :", x_t.shape, "\n")

# Joining the arrays
print("-- Joining --\n")

# Option 1: concatenate - vertical
ax_1 = np.concatenate(
    (h_t_prev, x_t), axis=0
)  # note the difference in axis parameter vs earlier
print("option 1 : concatenate\n")
print("ax_1 :")
print(ax_1)
print("ax_1 shape :", ax_1.shape, "\n")

# Option 2: vstack
ax_2 = np.vstack((h_t_prev, x_t))
print("option 2 : vstack\n")
print("ax_2 :")
print(ax_2)
print("ax_2 shape :", ax_2.shape)
-- Data --

h_t_prev :
[[ 0.61868921]
 [-0.60129131]]
h_t_prev shape : (2, 1) 

x_t :
[[1.04886699]
 [0.95044889]
 [0.9364125 ]]
x_t shape : (3, 1) 

-- Joining --

option 1 : concatenate

ax_1 :
[[ 0.61868921]
 [-0.60129131]
 [ 1.04886699]
 [ 0.95044889]
 [ 0.9364125 ]]
ax_1 shape : (5, 1) 

option 2 : vstack

ax_2 :
[[ 0.61868921]
 [-0.60129131]
 [ 1.04886699]
 [ 0.95044889]
 [ 0.9364125 ]]
ax_2 shape : (5, 1)
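
Before moving on, note why these joins matter: the joined weights have shape (3, 5) and the stacked vector has shape (5, 1), so they are compatible for matrix multiplication. A small optional check, assuming you have run the weights cell above so that w_h1 is still defined:

In [ ]:
# Optional shape check: (3, 5) @ (5, 1) -> (3, 1), so Formula 1 is well defined
print("w_h1 shape    :", w_h1.shape)
print("ax_1 shape    :", ax_1.shape)
print("product shape :", np.matmul(w_h1, ax_1).shape)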

Verify Formulas¶

Now that you know how to do the concatenations, horizontal and vertical, let's verify that the two formulas produce the same result.

Formula 1: $h^{<t>}=g(W_{h}[h^{<t-1>},x^{<t>}] + b_h)$

Formula 2: $h^{<t>}=g(W_{hh}h^{<t-1>} + W_{hx}x^{<t>} + b_h)$

To prove: Formula 1 $\Leftrightarrow$ Formula 2

You will ignore the bias term $b_h$ and the activation function $g(\ )$ because the transformation they apply is identical in both formulas. So what you really want to compare is the result of the matrix operations inside each formula:

$W_{h}[h^{<t-1>},x^{<t>}] \quad \Leftrightarrow \quad W_{hh}h^{<t-1>} + W_{hx}x^{<t>} $

You will do this by using matrix multiplication combined with the data and techniques (stacking/concatenating) from above.

  • Try adding a sigmoid activation function and bias term to the checks for completeness.
In [10]:
# Data

w_hh = np.full((3, 2), 1)  # returns an array of size 3x2 filled with all 1s
w_hx = np.full((3, 3), 9)  # returns an array of size 3x3 filled with all 9s
h_t_prev = np.full((2, 1), 1)  # returns an array of size 2x1 filled with all 1s
x_t = np.full((3, 1), 9)       # returns an array of size 3x1 filled with all 9s


# Randomized values are used below (comment out the next 4 lines to keep the illustrative values above)

w_hh = np.random.standard_normal((3,2))
w_hx = np.random.standard_normal((3,3))
h_t_prev = np.random.standard_normal((2,1))
x_t = np.random.standard_normal((3,1))

# Results
print("-- Results --")
# Formula 1
stack_1 = np.hstack((w_hh, w_hx))
stack_2 = np.vstack((h_t_prev, x_t))

print("\nFormula 1")
print("Term1:\n",stack_1)
print("Term2:\n",stack_2)
formula_1 = np.matmul(np.hstack((w_hh, w_hx)), np.vstack((h_t_prev, x_t)))
print("Output:")
print(formula_1)

# Formula 2
mul_1 = np.matmul(w_hh, h_t_prev)
mul_2 = np.matmul(w_hx, x_t)
print("\nFormula 2")
print("Term1:\n",mul_1)
print("Term2:\n",mul_2)

formula_2 = np.matmul(w_hh, h_t_prev) + np.matmul(w_hx, x_t)
print("\nOutput:")
print(formula_2, "\n")

# Verification 
# np.allclose - checks whether two arrays are element-wise equal up to a certain tolerance; see
# https://numpy.org/doc/stable/reference/generated/numpy.allclose.html

print("-- Verify --")
print("Results are the same :", np.allclose(formula_1, formula_2))

### START CODE HERE ###
# Try adding a sigmoid activation function and bias term as a final check
# Activation
def sigmoid(x):
    return 1 / (1 + np.exp(-x))

# Bias and check
b = np.random.standard_normal((formula_1.shape[0],1))
print("Formula 1 Output:\n",sigmoid(formula_1+b))
print("Formula 2 Output:\n",sigmoid(formula_2+b))

all_close = np.allclose(sigmoid(formula_1+b), sigmoid(formula_2+b))
print("Results after activation are the same :",all_close)
### END CODE HERE ###
-- Results --

Formula 1
Term1:
 [[-0.39592263  0.39751634  1.36071914  0.60180462  0.96837507]
 [-1.3778533  -1.32189437  1.02989684  0.7227928   0.14193341]
 [ 1.64256453  2.27180123  0.36753557  0.85186867 -0.1212865 ]]
Term2:
 [[ 0.43211439]
 [-0.0540839 ]
 [ 0.21838975]
 [-0.26839061]
 [ 1.04678843]]
Output:
[[ 0.95674912]
 [-0.34439467]
 [ 0.31157904]]

Formula 2
Term1:
 [[-0.1925831 ]
 [-0.52389704]
 [ 0.5869079 ]]
Term2:
 [[ 1.14933222]
 [ 0.17950237]
 [-0.27532886]]

Output:
[[ 0.95674912]
 [-0.34439467]
 [ 0.31157904]] 

-- Verify --
Results are the same : True
Formula 1 Output:
 [[0.50478839]
 [0.72142739]
 [0.51120695]]
Formula 2 Output:
 [[0.50478839]
 [0.72142739]
 [0.51120695]]
Results after activation are the same : True

Summary¶

That's it! You have verified that the two formulas produce the same results, and seen how to combine matrices vertically and horizontally to make that happen. You now have all the intuition needed to understand the math notation of RNNs.
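
If you'd like to consolidate everything into a single function, below is a minimal sketch (not part of the original notebook) of one vanilla RNN step that evaluates both formulas and asserts they agree. It uses np.tanh as the activation $g$, a common choice for vanilla RNNs; the function name forward_step and the dimensions are illustrative assumptions.

In [ ]:
import numpy as np

def forward_step(w_hh, w_hx, b_h, h_t_prev, x_t, g=np.tanh):
    """Compute h_t with both formulas and confirm they match."""
    # Formula 1: join the weights horizontally, stack the previous hidden state and the input vertically
    h_t_1 = g(np.matmul(np.hstack((w_hh, w_hx)), np.vstack((h_t_prev, x_t))) + b_h)
    # Formula 2: two separate multiplications, then a sum
    h_t_2 = g(np.matmul(w_hh, h_t_prev) + np.matmul(w_hx, x_t) + b_h)
    assert np.allclose(h_t_1, h_t_2)  # both formulas give the same hidden state
    return h_t_1

# Illustrative sizes only: hidden state of size 3, input of size 4
h_t = forward_step(
    w_hh=np.random.standard_normal((3, 3)),
    w_hx=np.random.standard_normal((3, 4)),
    b_h=np.random.standard_normal((3, 1)),
    h_t_prev=np.random.standard_normal((3, 1)),
    x_t=np.random.standard_normal((4, 1)),
)
print("h_t shape :", h_t.shape)  # (3, 1)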
