Image Operations¶
Task: perform broadcasting and reduction operations on a tensor representing a batch of color images
Goal: The goal of this exercise is to get used to thinking about the shapes of multidimensional structures. A surprisingly large amount of the thinking that goes into implementing neural net code is getting the shapes right. I didn't really believe that until I had to figure it out myself a couple of times, which convinced me that everyone could use some guided practice with it.
Setup¶
As usual, you don't need to understand the code in this section.
# Install/upgrade packages and check versions of Keras, TensorFlow, and JAX
!pip install -U keras einops
!pip list | egrep 'keras|tensorflow |jax '
import os
os.environ["KERAS_BACKEND"] = "jax"
import numpy as np
import matplotlib
import matplotlib.pyplot as plt
from pathlib import Path
import keras
import keras_cv
from keras import layers
import einops
print(f"Keras version: {keras.__version__}, backend: {keras.backend.backend()}")
Keras version: 3.0.5, backend: jax
def show_image(image, ax=None, cmap='gray'):
if ax is None:
ax = plt.gca()
ax.axis('off')
img = np.array(image)
context = {}
if len(img.shape) == 2 or img.shape[2] == 1:
# grayscale
context = {'image.cmap': cmap}
with matplotlib.rc_context(rc=context):
ax.imshow(img.astype('uint8'))
def show_image_grid(images, titles=None, rows=None, cols=3, title_fontsize=8, figsize=(10, 10), cmap='gray'):
if rows is None:
rows = (len(images) + (cols - 1)) // cols
fig, axs = plt.subplots(rows, cols, figsize=figsize)
# Turn off *all* axes (even those that we wouldn't show an image in)
for ax in axs.flatten(): ax.axis('off')
for i, ax in enumerate(axs.flatten()):
if i >= len(images): break
show_image(images[i], ax=ax, cmap=cmap)
if titles is not None:
ax.set_title(titles[i], fontsize=title_fontsize)
def get_images_from_dataset(dataset, indices):
if hasattr(dataset, 'file_paths'):
# FIXME: hardcoded options
img_loader_opts = dict(target_size=(256, 256), keep_aspect_ratio=True)
items_by_idx = {idx: keras.utils.load_img(dataset.file_paths[idx], **img_loader_opts) for idx in indices}
else:
items_by_idx = {idx: item for idx, (item, label) in enumerate(dataset.unbatch()) if idx in indices}
return [items_by_idx[idx] for idx in indices]
def channels_last_to_first(x):
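    # Move the channel axis from last to first: (batch, height, width, channels) -> (batch, channels, height, width).
    # This lets us index individual channels and display each one as its own grayscale image later on.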
return einops.rearrange(x, 'b h w c -> b c h w')
Configure¶
class config:
seed = 123
learning_rate = 1e-3
epochs = 1
batch_size = 9
image_size = (256, 256)
model_preset = "efficientnetv2_b0_imagenet"
# Reproducibility: Set a seed so that the results are the same every time this is run.
# See https://keras.io/examples/keras_recipes/reproducibility_recipes/
keras.utils.set_random_seed(config.seed)
Load the data¶
We'll use a dataset of flower images for this example, but you can later switch this out for another dataset as long as you keep the file-and-folder structure.
The details of the code in this section are not important at this time; just run these cells.
path_to_downloaded_file = keras.utils.get_file(
origin="https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz",
extract=True,
)
Let's see what just got downloaded.
data_path = Path(path_to_downloaded_file).parent / 'flower_photos'
print('\t'.join([path.name for path in data_path.iterdir()]))
roses sunflowers daisy dandelion tulips LICENSE.txt
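Each class has its own subdirectory of images; that one-folder-per-class layout is what lets the loading code below infer labels. If you're curious, a quick peek along these lines should work (assuming the images are stored as .jpg files, as they are in this dataset):
# Count the image files in each class subdirectory (skipping LICENSE.txt).
for class_dir in sorted(data_path.iterdir()):
    if class_dir.is_dir():
        print(f"{class_dir.name}: {len(list(class_dir.glob('*.jpg')))} images")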
We'll use the Keras utility function image_dataset_from_directory to load the data (see the Keras docs for details).
# Define which classes we want to use, in what order.
class_names = ['daisy', 'dandelion', 'roses', 'sunflowers', 'tulips']
# Create training and validation datasets
train_dataset, val_dataset = keras.utils.image_dataset_from_directory(
data_path,
validation_split=0.2,
labels='inferred',
class_names=class_names,
label_mode='int',
batch_size=config.batch_size,
image_size=config.image_size,
shuffle=True,
seed=128,
subset='both',
crop_to_aspect_ratio=True
)
Found 3670 files belonging to 5 classes. Using 2936 files for training. Using 734 files for validation.
Let's show some example images.
[[images, labels]] = train_dataset.take(1)
images = images.numpy()
labels = labels.numpy()
show_image_grid(
images,
titles=[f"{label} ({class_names[label]})" for label in labels])
Task¶
Note: all of these operations are one-liners. If you find yourself writing lots of code, pause and think more (or ask for help).
- What does each number of images.shape represent?
print(images.shape)
for i in range(len(images.shape)):
print(f"Axis {i} size is {images.shape[i]}")
(9, 256, 256, 3) Axis 0 size is 9 Axis 1 size is 256 Axis 2 size is 256 Axis 3 size is 3
your answer here
- Evaluate labels. Explain those numbers, with the help of class_names.
labels
array([0, 3, 0, 0, 2, 1, 1, 4, 4], dtype=int32)
class_names
['daisy', 'dandelion', 'roses', 'sunflowers', 'tulips']
your answer here
- Show the first image in the batch. (Use show_image.)
# your code here
- Show the average image. Hint: you can compute this by taking the .mean(axis=___); think about what the blank should be. (If the axis argument feels unfamiliar, see the toy example after this task list.)
# your code here
- Show the average of the middle 3 images.
You'll need to use slicing to compute this. (To make sure you're doing it right, first show the middle 3 images using show_image_grid.)
# your code here
- Show the grayscale version of all of the images.
  - Do this by making minimal changes to the previous exercise; do not import anything new.
  - For simplicity, just use an equal weighting of the red, green, and blue channels, i.e., take the mean across channels.
  - You can use show_image_grid to show all of the images.
# your code here
- Invert the color of the grayscale images (e.g., black becomes white). Show the result.
print(f"{gray_images.min()=}, {gray_images.max()=}")
gray_images.min()=0.0, gray_images.max()=253.33333333333334
# your code here
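If the axis argument in the hints above feels unfamiliar, here's a tiny toy array (separate from the flower images) to experiment with. Taking a mean along an axis collapses that axis, and broadcasting stretches a smaller result back across a larger one:
toy = np.arange(24).reshape(2, 3, 4)      # think of it as 2 tiny "images", each 3x4
print(toy.shape)                          # (2, 3, 4)
print(toy.mean(axis=0).shape)             # (3, 4): the first axis is averaged away
print(toy.mean(axis=-1).shape)            # (2, 3): the last axis is averaged away
print((toy - toy.mean(axis=0)).shape)     # (2, 3, 4): broadcasting stretches (3, 4) back across axis 0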
Convolution layers¶
We'll set up a demonstration convolution layer that we can poke at. We'll use random initialization, but set a seed so it's consistent. (Note that the specific random weights might depend on whether or not a GPU is being used, so you still may not see exactly the same outputs as the example.)
keras.utils.set_random_seed(0)
demo_conv_layer = layers.Conv2D(filters=4, kernel_size=(5, 5))
We'll try running it on a sample image. Since conv layers are designed to run on batches, we'll need to add a "batch" dimension to the image. We can do this with np.expand_dims, which adds a new dimension of size 1 at the specified position, or just by using slicing syntax; both give the same result.
example_image = images[5]
example_image_as_batch = images[5:6]
# alternative: example_image_as_batch = np.expand_dims(example_image, axis=0)
example_image_as_batch.shape
(1, 256, 256, 3)
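If you like, you can quickly confirm that the two approaches are equivalent:
# Slicing with images[5:6] and np.expand_dims(images[5], axis=0) produce the same batched array.
assert np.array_equal(np.expand_dims(example_image, axis=0), example_image_as_batch)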
Now we give that image batch to the conv layer. Predict what you think the output shape will be, and then check your answer by running the code.
demo_conv_activations = demo_conv_layer(example_image_as_batch)
#demo_conv_activations.shape
show_image_grid(
channels_last_to_first(demo_conv_activations)[0])
Finally, let's look at the weights of the conv layer. What shape do you expect them to be? Check your answer by running the code.
w, b = demo_conv_layer.get_weights()
# print(w.shape)
# print(b.shape)
Your turn:
- For each number in the shape of the activations, explain what it represents.
- For each number in the shape of the weights, explain what it represents.
- For each of those numbers above, change something about the code above so that that number changes (or explain why you can't). Explain the changes you made.
your answer here
A real conv layer¶
Let's just look at what a real conv layer does. We'll load the pretrained backbone that we used in prior homeworks, find its first conv layer, and run it on the same image.
First, loading the model:
# Create a model using a pretrained backbone
# See https://keras.io/api/keras_cv/models/tasks/image_classifier/ for options
model = keras_cv.models.ImageClassifier.from_preset(
config.model_preset,
num_classes=len(class_names))
model.backbone.summary()
Model: "efficient_net_v2b0_backbone"
Layer (type)                       Output Shape               Param #
input_layer (InputLayer)           (None, None, None, 3)            0
rescaling (Rescaling)              (None, None, None, 3)            0
stem_conv (Conv2D)                 (None, None, None, 32)         864
stem_bn (BatchNormalization)       (None, None, None, 32)         128
stem_activation (Activation)       (None, None, None, 32)           0
block1a_ (FusedMBConvBlock)        (None, None, None, 16)       4,672
block2a_ (FusedMBConvBlock)        (None, None, None, 32)      11,648
block2b_ (FusedMBConvBlock)        (None, None, None, 32)      41,600
block3a_ (FusedMBConvBlock)        (None, None, None, 48)      43,712
block3b_ (FusedMBConvBlock)        (None, None, None, 48)      93,120
block4a_ (MBConvBlock)             (None, None, None, 96)      36,108
block4b_ (MBConvBlock)             (None, None, None, 96)      99,480
block4c_ (MBConvBlock)             (None, None, None, 96)      99,480
block5a_ (MBConvBlock)             (None, None, None, 112)    158,296
block5b_ (MBConvBlock)             (None, None, None, 112)    200,732
block5c_ (MBConvBlock)             (None, None, None, 112)    200,732
block5d_ (MBConvBlock)             (None, None, None, 112)    200,732
block5e_ (MBConvBlock)             (None, None, None, 112)    200,732
block6a_ (MBConvBlock)             (None, None, None, 192)    254,812
block6b_ (MBConvBlock)             (None, None, None, 192)    574,512
block6c_ (MBConvBlock)             (None, None, None, 192)    574,512
block6d_ (MBConvBlock)             (None, None, None, 192)    574,512
block6e_ (MBConvBlock)             (None, None, None, 192)    574,512
block6f_ (MBConvBlock)             (None, None, None, 192)    574,512
block6g_ (MBConvBlock)             (None, None, None, 192)    574,512
block6h_ (MBConvBlock)             (None, None, None, 192)    574,512
top_conv (Conv2D)                  (None, None, None, 1280)   245,760
top_bn (BatchNormalization)        (None, None, None, 1280)     5,120
top_activation (Activation)        (None, None, None, 1280)         0
Total params: 5,919,312 (22.58 MB)
Trainable params: 5,858,704 (22.35 MB)
Non-trainable params: 60,608 (236.75 KB)
The first layer rescales the input from [0, 255] to [0, 1].
1/model.backbone.layers[1].scale
255.0
Right after that is the first conv layer:
first_conv = model.backbone.layers[2]
w, = first_conv.get_weights()
w.shape
(3, 3, 3, 32)
Let's try it on our example images. We'll manually rescale before and after, to make sure we're doing the same thing as the model.
first_conv_out = first_conv(images / 255.0)
first_conv_out.shape
(9, 128, 128, 32)
You might be confused by the output shape: why is it 128x128? That's because this layer uses strided convolutions, which we haven't talked about yet. Basically, with a stride of 2, only every other output position is kept along each spatial dimension. Also, padding='same', so no pixels are lost at the borders.
first_conv.strides, first_conv.padding
((2, 2), 'same')
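As a quick sanity check on that claim (assuming the usual output-size rule for 'same' padding, namely output = ceil(input / stride)):
import math
in_size = 256
stride = first_conv.strides[0]          # 2
out_size = math.ceil(in_size / stride)  # 'same' padding keeps every stride-th position, no border loss
print(out_size)                         # 128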
So what's it look like? Let's visualize the output.
show_image(images[5])
show_image_grid(
channels_last_to_first(first_conv_out)[5][:9] * 255.0)
Analysis: In the summary table above, find this first convolution layer. Note the Param # column. Write an expression (like one you'd type into a code cell) that uses the values from the kernel shape you saw above and evaluates to the number of parameters in this layer (864).
your answer here