## Preamble / required packages
import numpy as np
np.random.seed(0)
## Import local plotting functions and in-notebook display functions
import matplotlib.pyplot as plt
from IPython.display import Image, display
%matplotlib inline
import warnings
## Comment this out to activate warnings
warnings.filterwarnings('ignore')
plt.style.use("dark_background")
More advanced neural network types¶
- Recall that a neural network is any trainable function that maps a vector to a vector
- In the previous notebook, we saw how to train a multilayer perceptron (MLP)
For example, a two-layer MLP: $$ \hat{\mathbf{y}} = \sigma(\boldsymbol{\theta}_2 \sigma(\boldsymbol{\theta}_1 \mathbf{x})) $$
We can also write a recurrence relation for the $i$-th hidden layer
$$ \mathbf{h}_i = \sigma(\boldsymbol{\theta}_i \mathbf{h}_{i-1}) \quad \text{for } i = 1, \ldots, L+1 $$ where $\mathbf{h}_0 = \mathbf{x}$ and $\mathbf{h}_{L+1} = \hat{\mathbf{y}}$
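As a minimal sketch (with random, untrained weights and arbitrary example sizes), this recurrence is just a loop of matrix multiplications and nonlinearities:
## Sketch of the MLP recurrence with random (untrained) weights
sigma = np.tanh  # elementwise nonlinearity
layer_sizes = [5, 8, 8, 3]  # input, two hidden layers, output (arbitrary sizes)
thetas = [np.random.randn(m, n) for n, m in zip(layer_sizes[:-1], layer_sizes[1:])]
h = np.random.randn(layer_sizes[0])  # h_0 = x
for theta in thetas:
    h = sigma(theta @ h)  # h_i = sigma(theta_i h_{i-1})
print(h)  # h_{L+1} = y_hat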
More elaborate architectures and structures exist¶
- Convolutional neural networks (trainable convolutional kernels)
- Recurrent neural networks (trainable transition matrices for sequential data)
- Residual networks (matrix multiplications with "skip" connections for easier gradient-based training)
- Autoencoders (unsupervised representation learning)
- Generative models (GANs, VAEs, diffusion models, etc.)
- Neural ODEs (trainable ODEs)
- Transformers (attention-based architectures)
Physical symmetries as a prior on model space¶
- When working with physical data, we are often aware of certain constraints that a model of the process must obey
- A model that classifies an ergodic dynamical system should be invariant to time translation
- A model that classifies images of a crystal should be invariant to shifts along lattice symmetries
- A model that classifies a fluid flow should be invariant to spatial translations
A few options¶
- Ignore our knowledge, and obtain enough data that the model can learn the underlying symmetry, albeit approximately
- Featurize the data in such a way that the symmetry is preserved (e.g. a Fourier transform of time series data; see the sketch after this list)
- Constrain the model space to enforce the symmetry
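As a minimal sketch of the featurization option (assuming a periodic signal), the magnitude of the discrete Fourier transform is unchanged by circular time shifts:
## Sketch: Fourier magnitudes as shift-invariant features
x = np.random.randn(128)  # a time series
x_shifted = np.roll(x, 17)  # a circularly time-shifted copy
feats = np.abs(np.fft.rfft(x))  # featurize by Fourier magnitudes
feats_shifted = np.abs(np.fft.rfft(x_shifted))
print(np.allclose(feats, feats_shifted))  # True: the features ignore the shift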
Many data types have implicit structure on feature space¶
- The content of an image is typically unchanged by spatial translations
- The statistics of a stationary time series are unchanged by time translations
Convolutional neural networks¶
- Early layers perform discrete convolutions with the inputs
- Best suited to data where the features have an implicit metric (spatial lattices, time series, etc.)
- If I can randomly shuffle my features without expecting a change in model performance, then I don't need a convolutional layer. However, if the feature order matters, then I should consider a CNN
- Convolutions usually preserve the dimensionality of the "long" feature directions (image sizes, time series lengths, etc), but change the dimensionality of the "short" feature directions (number of channels, number of features, etc)
- Usually convolutions are followed by "pooling" operations, which aggregate groups of adjacent features (like nearby pixels) into single summary values
- Later layers perform matrix multiplications with the outputs of the convolutional layers (similar to a multilayer perceptron)
- Can be generalized to data on graphs (graph convolutional networks)
Image('../resources/cnn.png', width=700)
# https://www.theclickreader.com/introduction-to-convolutional-neural-networks/
We'll load the turbulence snapshot dataset to demonstrate¶
## load the turbulence dataset
all_vorticity_fields = list()
all_reynolds_numbers = list()
# Load simulations for different Reynolds numbers
re_vals = [300, 600, 900, 1200]
for re_val in re_vals:
    # Load the two-dimensional velocity field data. Data is stored in a 4D numpy array,
    # where the first dimension is the time index, the second and third dimensions are the
    # x and y coordinates, and the fourth dimension is the velocity components (ux or uy).
    vfield = np.load(
        f"../resources/von_karman_street/vortex_street_velocities_Re_{re_val}_largefile.npz",
        allow_pickle=True
    )
    # Calculate the vorticity, which is the (scalar) curl of the velocity field
    vort_field = np.diff(vfield, axis=1)[..., :-1, 1] - np.diff(vfield, axis=2)[:, :-1, :, 0]
    # Downsample the dataset
    vort_field = vort_field[::6, -127:, :]
    all_vorticity_fields.append(vort_field)
    all_reynolds_numbers.extend(re_val * np.ones(vort_field.shape[0]))
all_vorticity_fields = np.vstack(all_vorticity_fields)
all_reynolds_numbers = np.array(all_reynolds_numbers)
print("Vorticity field data has shape: {}".format(all_vorticity_fields.shape))
print("Reynolds number data has shape: {}".format(all_reynolds_numbers.shape))
## Plot some example snapshots of the vorticity field
fig, axes = plt.subplots(1, 4, figsize=(16, 4))
for ax, re_val in zip(axes, re_vals):
    ax.imshow(all_vorticity_fields[all_reynolds_numbers == re_val][0], cmap='bwr', vmin=-0.01, vmax=0.01)
    ax.set_title(f"Re = {re_val}")
    ax.axis('off')
## Convert into a machine-learning dataset by flattening features
# Flatten the vorticity field data
X = np.reshape(all_vorticity_fields, (all_vorticity_fields.shape[0], -1))
y = all_reynolds_numbers
# train test split
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=0)
print("Training data has shape: {}".format(X.shape))
print("Training labels have shape: {}".format(y.shape))
Vorticity field data has shape: (2000, 127, 127) Reynolds number data has shape: (2000,) Training data has shape: (2000, 16129) Training labels have shape: (2000,)
How many features does each input datapoint have?¶
print(all_vorticity_fields[0].shape)
print(X[0].shape)
(127, 127)
(16129,)
How many trainable parameters would a fully-connected MLP have?¶
nh1 = 100
nh2 = 100
nh3 = 100
print(f"Total number of a parameters: {X.shape[1] * nh1 + nh1 * nh2 +nh2 * nh3}")
## Note: I'm not including bias terms in this calculation
Total number of a parameters: 1632900
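For comparison (a rough sketch, ignoring biases and assuming a single input channel), a convolutional layer's parameter count depends only on the kernel size and the number of kernels, not on the image size:
n_kernels = 16  # a hypothetical number of 3 x 3 convolutional kernels
print(f"Parameters in the convolutional layer: {n_kernels * 3 * 3}")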
What do convolutional filters do?¶
plt.figure()
plt.imshow(all_vorticity_fields[0], cmap='bwr', vmin=-0.01, vmax=0.01)
plt.title("Input Image")
## Define some possible convolutional filters
kernel1 = np.array([[0, 1, 0], [1, -4, 1], [0, 1, 0]])  # 5-point discrete Laplacian (edge detector)
kernel2 = np.array([[1, 1, 1], [1, -8, 1], [1, 1, 1]])  # 8-neighbor discrete Laplacian
kernel3 = np.random.randn(20, 20)  # a large random kernel
import scipy.signal
h1 = scipy.signal.convolve2d(all_vorticity_fields[0], kernel1, mode='same')
plt.figure()
plt.imshow(h1, cmap='bwr')
plt.title("Activation pattern of first filter")
h2 = scipy.signal.convolve2d(all_vorticity_fields[0], kernel2, mode='same')
plt.figure()
plt.imshow(h2, cmap='bwr')
plt.title("Activation pattern of second filter")
h3 = scipy.signal.convolve2d(all_vorticity_fields[0], kernel3, mode='same')
plt.figure()
plt.imshow(h3, cmap='bwr')
plt.title("Activation pattern of third filter")
## Pool the filtered images
def max_pool(arr, n=3):
    """Pool an array by taking the maximum over non-overlapping n x n blocks"""
    out = np.zeros_like(arr)
    for i in range(0, arr.shape[0], n):
        for j in range(0, arr.shape[1], n):
            out[i:i+n, j:j+n] = np.max(arr[i:i+n, j:j+n])  # fill each block with its max
    out = out[::n, ::n]  # keep one entry per block
    return out
h3_pool = max_pool(h3)
plt.figure()
plt.imshow(h3, cmap='bwr')
plt.title("Activation pattern of third filter")
plt.figure()
plt.imshow(h3_pool, cmap='bwr')
plt.title("Activation pattern of third filter pooled")
Let's put it all together to see what these models might look like¶
- We aren't yet discussing how to train these models, so we will just randomly initialize the weights and kernels
## We are not training our models; these have random weights
class MultilayerPerceptron:
    def __init__(self, input_shape, output_shape, hidden_shapes=[100, 100]):
        self.input_shape = input_shape
        self.output_shape = output_shape
        self.hidden_shapes = hidden_shapes
        self.layers = []
        for i, shape in enumerate(hidden_shapes):
            print(f"Hidden {i + 1} shape: ", (shape, input_shape))
            self.layers.append(np.random.randn(shape, input_shape))
            input_shape = shape
        print("Output shape: ", (output_shape, input_shape))
        self.layers.append(np.random.randn(output_shape, input_shape))

    def _sigma(self, x):
        """
        A tanh nonlinear activation function used in the neural network.
        """
        return np.tanh(x)

    def forward(self, x):
        for layer in self.layers:
            x = self._sigma(np.dot(layer, x))
        return x
model = MultilayerPerceptron(X_train[0].shape[-1], 10, hidden_shapes=[100, 100])
model.forward(X_train[0])
Hidden 1 shape: (100, 16129)
Hidden 2 shape: (100, 100)
Output shape: (10, 100)
array([-0.99999998, -0.52595475, -0.99999941, -1. , -0.99715747, -0.99999999, -0.69733068, 0.99999055, -0.99396775, 1. ])
class ConvolutionalNeuralNetwork:
    """
    A convolutional neural network with 1 convolutional layer, 1 pooling layer, and
    arbitrary hidden layers.
    """
    def __init__(self, input_shape, output_shape, pool_size=10, hidden_shapes=[100, 100]):
        self.input_shape = input_shape
        self.output_shape = output_shape
        self.hidden_shapes = hidden_shapes
        self.pool_size = pool_size
        self.kernel = np.random.randn(3,)
        print("Conv1 shape: ", self.kernel.shape)
        input_shape = (input_shape - self.kernel.shape[-1] + 1) // self.pool_size
        self.layers = []
        for i, shape in enumerate(hidden_shapes):
            print(f"Hidden {i + 1} shape: ", (shape, input_shape))
            self.layers.append(np.random.randn(shape, input_shape))
            input_shape = shape
        print("Output shape: ", (output_shape, input_shape))
        self.layers.append(np.random.randn(output_shape, input_shape))

    def _sigma(self, x):
        """
        A ReLU nonlinear activation function used in the neural network.
        """
        return np.maximum(x, 0)

    def forward(self, x):
        # Convolution
        x = self._sigma(np.convolve(x, self.kernel, mode='same'))
        # Max-pooling: take the max value of each pool_size x 1 block
        all_clumps = [x[i::self.pool_size] for i in range(self.pool_size)]
        min_len = min([len(clump) for clump in all_clumps])
        all_clumps = np.array([clump[:min_len] for clump in all_clumps])
        x = all_clumps.max(axis=0)
        for layer in self.layers:
            x = self._sigma(np.dot(layer, x))
        return x
model = ConvolutionalNeuralNetwork(X_train[0].shape[-1], 10, hidden_shapes=[100, 100])
model.forward(X_train[0])
Conv1 shape: (3,)
Hidden 1 shape: (100, 1612)
Hidden 2 shape: (100, 100)
Output shape: (10, 100)
array([0. , 0.16714396, 0. , 0. , 0.4024182 , 0. , 0.81681566, 0.45454396, 0. , 1.08882927])
Residual networks¶
- Residual networks are a special case of a neural network with skip connections
- These skip connections make deeper networks easier to train by mitigating "vanishing gradients," an issue that arises in gradient-based training of deep networks
- We'll discuss training DNNs in more detail later
$$ \mathbf{h}_t = \sigma(\mathbf{W}_t \mathbf{h}_{t-1}) + \mathbf{h}_{t-1} $$
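As a minimal sketch (random, untrained weights), a single residual block just adds its input back onto the layer output:
## Sketch of one residual block with random (untrained) weights
n = 8
W = np.random.randn(n, n) / np.sqrt(n)  # one trainable layer
h = np.random.randn(n)
h_next = np.tanh(W @ h) + h  # the skip connection adds the input back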
Image('../resources/residual.png', width=700)
# https://datascience.eu/machine-learning/an-overview-of-resnet-and-its-variants/
Recurrent neural networks¶
- Neural networks for sequential data (time series, text, etc)
- The hidden state at each timestep is a function of the previous state and the current input; the same trainable transition matrices are applied (iterated) at every step of the sequence
$$ \mathbf{h}_t = \sigma(\mathbf{W}_h \mathbf{h}_{t-1} + \mathbf{W}_x \mathbf{x}_t) $$
$$ \mathbf{y}_t = \sigma(\mathbf{W}_y \mathbf{h}_t) $$
Compare to a multilayer perceptron, which takes a single input, propagates it across several hidden layers with different weight matrices, and then returns a single output: $$ \mathbf{h}_t = \sigma(\mathbf{W}_t \mathbf{h}_{t-1}) $$
$$ \mathbf{y}_t = \mathbf{h}_t $$
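Returning to the RNN: as a minimal sketch (random, untrained weights; the sizes are arbitrary), the same matrices are reused at every timestep:
## Sketch of an unrolled RNN with random (untrained) weights
n_h, n_x, n_y, n_steps = 16, 4, 2, 10
W_h = np.random.randn(n_h, n_h) / np.sqrt(n_h)  # trainable transition matrix
W_x = np.random.randn(n_h, n_x)  # input matrix
W_y = np.random.randn(n_y, n_h)  # readout matrix
xs = np.random.randn(n_steps, n_x)  # an input sequence
h = np.zeros(n_h)
for x_t in xs:
    h = np.tanh(W_h @ h + W_x @ x_t)  # same weights reused at every timestep
y = np.tanh(W_y @ h)  # readout at the final timestep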
Image('../resources/rnn.png', width=700)
# http://cs231n.stanford.edu/slides/2021/lecture_10.pdf
Autoencoders¶
- Neural networks for unsupervised representation learning
Encoder: $$ \mathbf{z} = \mathbf{f}(\mathbf{x}) $$
Decoder: $$ \hat{\mathbf{x}} = \mathbf{g}(\mathbf{z}) $$
Both $\mathbf{f}$ and $\mathbf{g}$ are neural networks (multilayer perceptrons, etc.)
- The encoder and decoder are trained to minimize the reconstruction error
$$ \mathcal{L} = \frac{1}{N} \sum_{i=1}^N \left\| \mathbf{x}_i - \hat{\mathbf{x}}_i \right\|_2^2 $$
- By putting constraints on the latent space (the space of the encoded data), we can reduce dimensionality (à la PCA) or enforce certain symmetries (e.g. invariance to rotations)
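As a minimal sketch (random, untrained weights), a linear autoencoder compresses each input into a low-dimensional latent vector and reconstructs from it:
## Sketch of a linear autoencoder with random (untrained) weights
n_features, n_latent = 100, 5
W_enc = np.random.randn(n_latent, n_features)  # encoder f
W_dec = np.random.randn(n_features, n_latent)  # decoder g
x = np.random.randn(n_features)
z = W_enc @ x  # latent representation
x_hat = W_dec @ z  # reconstruction
print(np.mean((x - x_hat)**2))  # the reconstruction error that training would minimize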
Image('../resources/ae2.png', width=800)
# https://medium.com/@birla.deepak26/autoencoders-76bb49ae6a8f
Image('../resources/ae.png', width=800)
# Gilpin et al 2019, https://www.sciencedirect.com/science/article/abs/pii/S2452310020300147
What else is out there?¶
- Anything that takes a vector and returns a vector can be a neural network
- The hard part is finding a way to train it, ideally using gradient descent
Transformers¶
- Replacing RNNs for large sequential datasets
- Attention mechanism: each element of the sequence learns how strongly to weight ("attend to") every other element
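As a minimal sketch of a single attention operation (random, untrained weights; this omits the multi-head and positional machinery of a full transformer):
## Sketch of scaled dot-product attention with random (untrained) weights
n_seq, d = 6, 8  # sequence length and model dimension
X = np.random.randn(n_seq, d)  # a sequence of input vectors
W_q, W_k, W_v = [np.random.randn(d, d) for _ in range(3)]
Q, K, V = X @ W_q, X @ W_k, X @ W_v  # queries, keys, values
scores = Q @ K.T / np.sqrt(d)  # how strongly each position attends to the others
weights = np.exp(scores) / np.exp(scores).sum(axis=1, keepdims=True)  # row-wise softmax
attended = weights @ V  # each output is a weighted mixture of the values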
Variational autoencoders (and generative models in general)¶
- Input vectors are sampled from some unknown distribution
- Learn a latent probability distribution; sampling from it generates new datapoints similar to the training data
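As a minimal sketch (with an untrained, random decoder standing in for a trained one), generation amounts to decoding samples drawn from the latent distribution:
## Sketch: generating a new datapoint by decoding a latent sample
n_features, n_latent = 100, 5
W_dec = np.random.randn(n_features, n_latent)  # stands in for a trained decoder
z = np.random.randn(n_latent)  # draw from a standard normal latent prior
x_new = W_dec @ z  # a new "datapoint" (meaningless here, since the decoder is untrained)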
Neural ODEs¶
- Instead of having "Layers," train a continuous-time ODE that maps an input vector to an output vector
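As a minimal sketch (random, untrained vector field), the forward pass is numerical integration; here forward Euler stands in for a proper ODE solver:
## Sketch of a neural ODE forward pass via forward Euler integration
n, dt, n_steps = 8, 0.01, 100
W = np.random.randn(n, n) / np.sqrt(n)  # trainable parameters of the vector field
f = lambda h: np.tanh(W @ h)  # dh/dt = f(h)
h = np.random.randn(n)  # h(0) = x, the input vector
for _ in range(n_steps):
    h = h + dt * f(h)  # after integration, h(T) is the output vector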
Diffusion models¶
- Generative models that assume the training data are samples from some underlying distribution
- Simulate the forward/backward Kolmogorov equations to generate new datapoints similar to the training data
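Here is a minimal sketch of the forward (noising) half of this process; a trained diffusion model learns to run these steps in reverse, turning noise back into data:
## Sketch of the forward (noising) process used by diffusion models
x = np.random.randn(64)  # stand-in for a training datapoint
beta = 0.05  # per-step noise level
for _ in range(50):
    x = np.sqrt(1 - beta) * x + np.sqrt(beta) * np.random.randn(64)  # add a little noise
## After many steps, x is statistically indistinguishable from pure Gaussian noise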
Image('../resources/representations.png', width=800)