initial commit, adds notes.md for instructions, adds data, adds python code
commit 25fa687f7f
37  .devcontainer/Dockerfile  Normal file
@@ -0,0 +1,37 @@
FROM tensorflow/tensorflow:1.13.2-gpu

## Install updates and network tools
RUN apt-get update -y && apt-get upgrade -y && apt install net-tools -y

## Install basic functions
RUN apt-get install sudo -y

## Install git
RUN apt-get install git -y

## Install python requirements
COPY requirements.txt .
RUN pip install -r requirements.txt

## Create user and group
ARG HOST_USER_UID=1000
ARG HOST_USER_GID=1000
RUN groupadd -g $HOST_USER_GID containergroup
RUN useradd -m -l -u $HOST_USER_UID -g $HOST_USER_GID containeruser

## Passwordless sudo for user
RUN usermod -aG sudo containeruser
RUN echo "containeruser ALL=(root) NOPASSWD:ALL" > /etc/sudoers.d/containeruser && \
    chmod 0440 /etc/sudoers.d/containeruser

## Activate user
USER containeruser

## Set working directory
WORKDIR /home/containeruser

## Workaround for vscode bug
ENV HOME=/home/containeruser

## Keep container running forever
CMD tail -f /dev/null
12  .devcontainer/devcontainer.json  Normal file
@@ -0,0 +1,12 @@
{
    "name": "siamese",
    "dockerComposeFile": "docker-compose.yml",
    "workspaceMount": "/workspace",
    "workspaceFolder": "/workspace",
    "service": "devcontainer",
    "shutdownAction": "stopCompose",
    "extensions": [
        "ms-python.python",
        "ms-azuretools.vscode-docker"
    ]
}
22  .devcontainer/docker-compose.yml  Normal file
@@ -0,0 +1,22 @@
version: '2.3'
services:
  devcontainer:

    build:
      context: ..
      dockerfile: .devcontainer/Dockerfile
      args:
        HOST_USER_UID: 1000
        HOST_USER_GID: 1000

    network_mode: host
    environment:
      - DISPLAY=$DISPLAY
    runtime: nvidia

    volumes:
      - ..:/workspace
      - ~/.gitconfig:/home/containeruser/.gitconfig
      - ~/.ssh:/home/containeruser/.ssh

    command: sleep infinity
114  .gitignore  vendored  Normal file
@@ -0,0 +1,114 @@
# Byte-compiled / optimized / DLL files
__pycache__/
*.py[cod]
*$py.class

# C extensions
*.so

# Distribution / packaging
.Python
build/
develop-eggs/
dist/
downloads/
eggs/
.eggs/
lib/
lib64/
parts/
sdist/
var/
wheels/
*.egg-info/
.installed.cfg
*.egg
MANIFEST

# PyInstaller
# Usually these files are written by a python script from a template
# before PyInstaller builds the exe, so as to inject date/other infos into it.
*.manifest
*.spec

# Installer logs
pip-log.txt
pip-delete-this-directory.txt

# Unit test / coverage reports
htmlcov/
.tox/
.coverage
.coverage.*
.cache
nosetests.xml
coverage.xml
*.cover
.hypothesis/
.pytest_cache/

# Translations
*.mo
*.pot

# Django stuff:
*.log
local_settings.py
db.sqlite3

# Flask stuff:
instance/
.webassets-cache

# Scrapy stuff:
.scrapy

# Sphinx documentation
docs/_build/

# PyBuilder
target/

# Jupyter Notebook
.ipynb_checkpoints

# pyenv
.python-version

# celery beat schedule file
celerybeat-schedule

# SageMath parsed files
*.sage.py

# Environments
.env
.venv
env/
venv/
ENV/
env.bak/
venv.bak/

# Spyder project settings
.spyderproject
.spyproject

# Rope project settings
.ropeproject

# mkdocs documentation
/site

# mypy
.mypy_cache/

/env

# idea files
.idea/

# model checkpoint data
checkpoint
model_checkpoint
siamese_checkpoint
21  LICENSE  Normal file
@@ -0,0 +1,21 @@
MIT License

Copyright (c) 2018 aspamers

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
144  README.md  Normal file
@@ -0,0 +1,144 @@
# Siamese Neural Network for Keras

This project provides a lightweight, easy to use and flexible siamese neural network module for use with the Keras
framework.

Siamese neural networks are used to generate embeddings that describe inter- and extra-class relationships.
This makes siamese networks, like many other similarity-learning algorithms, suitable as a pre-training step for many
classification problems.

An example of the siamese network module being used to produce a noteworthy 99.85% validation performance on the MNIST
dataset with no data augmentation and minimal modification from the Keras example is provided.

## Installation

Create and activate a virtual environment for the project.
```sh
$ virtualenv env
$ source env/bin/activate
```

To install the module directly from GitHub:
```
$ pip install git+https://github.com/aspamers/siamese
```

The module will install keras and numpy but no back-end (like tensorflow). This is deliberate, since it leaves the
module decoupled from any back-end and gives you a chance to install whatever back-end you prefer.

To install tensorflow:
```
$ pip install tensorflow
```

To install tensorflow with gpu support:
```
$ pip install tensorflow-gpu
```

## To run examples

With the virtual environment activated and the python package installed, run the following commands.

To run the mnist baseline example:
```
$ python mnist_example.py
```

To run the mnist siamese pretrained example:
```
$ python mnist_siamese_example.py
```

## Usage

For detailed usage examples please refer to the examples and unit test modules. If the instructions are not sufficient,
feel free to make a request for improvements.

- Import the module
```python
from siamese import SiameseNetwork
```

- Load or generate some data.
```python
x_train = np.random.rand(100, 3)
y_train = np.random.randint(num_classes, size=100)

x_test = np.random.rand(30, 3)
y_test = np.random.randint(num_classes, size=30)
```

- Design a base model
```python
def create_base_model(input_shape):
    model_input = Input(shape=input_shape)

    embedding = Flatten()(model_input)
    embedding = Dense(128)(embedding)

    return Model(model_input, embedding)
```

- Design a head model
```python
def create_head_model(embedding_shape):
    embedding_a = Input(shape=embedding_shape)
    embedding_b = Input(shape=embedding_shape)

    head = Concatenate()([embedding_a, embedding_b])
    head = Dense(4)(head)
    head = BatchNormalization()(head)
    head = Activation(activation='sigmoid')(head)

    head = Dense(1)(head)
    head = BatchNormalization()(head)
    head = Activation(activation='sigmoid')(head)

    return Model([embedding_a, embedding_b], head)
```

- Create an instance of the SiameseNetwork class
```python
base_model = create_base_model(input_shape)
head_model = create_head_model(base_model.output_shape)
siamese_network = SiameseNetwork(base_model, head_model)
```

- Compile the model
```python
siamese_network.compile(loss='binary_crossentropy', optimizer=keras.optimizers.adam())
```

- Train the model
```python
siamese_network.fit(x_train, y_train,
                    validation_data=(x_test, y_test),
                    batch_size=64,
                    epochs=epochs)
```
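
- Score new pairs with the trained network. A hedged sketch, not an official module API: it reaches into the
underlying combined Keras model through the `siamese_model` attribute defined in siamese.py, and assumes `x_a`
and `x_b` are numpy arrays shaped like the base model's input.
```python
# Predict similarity for aligned pairs (x_a[i], x_b[i]).
# The pair generator labels same-class pairs 1.0, so higher scores mean "same class".
scores = siamese_network.siamese_model.predict([x_a, x_b])
print(scores)
```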

## Development Environment
Create and activate a test virtual environment for the project.
```sh
$ virtualenv env
$ source env/bin/activate
```

Install requirements
```sh
$ pip install -r requirements.txt
```

Install the backend of your choice.
```
$ pip install tensorflow
```

Run tests
```sh
$ pytest tests/test_siamese.py
```

## Development container
To set up the vscode development container, follow the instructions at the link provided:
https://github.com/aspamers/vscode-devcontainer

You will also need to install the nvidia docker gpu passthrough layer:
https://github.com/NVIDIA/nvidia-docker
94  mnist_example.py  Normal file
@@ -0,0 +1,94 @@
"""
This is a modified version of the Keras mnist example.
https://keras.io/examples/mnist_cnn/

Instead of using a fixed number of epochs this version continues to train
until the stop criteria is reached.

Model performance should be around 99.4% after training.
"""

from __future__ import print_function
import keras
from keras.datasets import mnist
from keras.layers import Conv2D, MaxPooling2D, BatchNormalization, Activation
from keras import backend as K
from keras.callbacks import ModelCheckpoint, EarlyStopping
from keras.models import Model
from keras.layers import Input, Flatten, Dense

batch_size = 128
num_classes = 10
epochs = 999999

# input image dimensions
img_rows, img_cols = 28, 28

# the data, split between train and test sets
(x_train, y_train), (x_test, y_test) = mnist.load_data()

if K.image_data_format() == 'channels_first':
    x_train = x_train.reshape(x_train.shape[0], 1, img_rows, img_cols)
    x_test = x_test.reshape(x_test.shape[0], 1, img_rows, img_cols)
    input_shape = (1, img_rows, img_cols)
else:
    x_train = x_train.reshape(x_train.shape[0], img_rows, img_cols, 1)
    x_test = x_test.reshape(x_test.shape[0], img_rows, img_cols, 1)
    input_shape = (img_rows, img_cols, 1)

x_train = x_train.astype('float32')
x_test = x_test.astype('float32')
x_train /= 255
x_test /= 255

y_train = keras.utils.to_categorical(y_train, num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes)


def create_base_network(input_shape):
    input = Input(shape=input_shape)
    x = Conv2D(32, kernel_size=(3, 3),
               input_shape=input_shape)(input)
    x = BatchNormalization()(x)
    x = Activation(activation='relu')(x)
    x = MaxPooling2D(pool_size=(2, 2))(x)
    x = Conv2D(64, kernel_size=(3, 3))(x)
    x = BatchNormalization()(x)
    x = Activation(activation='relu')(x)
    x = MaxPooling2D(pool_size=(2, 2))(x)
    x = Flatten()(x)
    x = Dense(128)(x)
    x = BatchNormalization()(x)
    x = Activation(activation='relu')(x)
    x = Dense(num_classes)(x)
    x = BatchNormalization()(x)
    x = Activation(activation='softmax')(x)
    return Model(input, x)


model = create_base_network(input_shape)
model.compile(loss=keras.losses.categorical_crossentropy,
              optimizer=keras.optimizers.adam(),
              metrics=['accuracy'])

checkpoint_path = "./checkpoint"

callbacks = [
    EarlyStopping(monitor='val_acc', patience=10, verbose=0),
    ModelCheckpoint(checkpoint_path,
                    monitor='val_acc',
                    save_best_only=True,
                    verbose=0)
]
model.fit(x_train, y_train,
          batch_size=batch_size,
          epochs=epochs,
          verbose=1,
          callbacks=callbacks,
          validation_data=(x_test, y_test))

model.load_weights(checkpoint_path)

score = model.evaluate(x_test, y_test, verbose=0)
print('Test loss:', score[0])
print('Test accuracy:', score[1])
299  mnist_siamese_example.py  Normal file
@@ -0,0 +1,299 @@
"""
This is a modified version of the Keras mnist example.
https://keras.io/examples/mnist_cnn/

Instead of using a fixed number of epochs this version continues to train until a stop criteria is reached.

A siamese neural network is used to pre-train an embedding for the network. The resulting embedding is then extended
with a softmax output layer for categorical predictions.

Model performance should be around 99.84% after training. The resulting model is identical in structure to the one in
the example yet shows considerable improvement in relative error, confirming that the embedding learned by the siamese
network is useful.
"""

from __future__ import print_function
import tensorflow.keras as keras
from tensorflow.keras.datasets import mnist
from tensorflow.keras.layers import Conv2D, MaxPooling2D, BatchNormalization, Activation, Concatenate
from tensorflow.keras import backend as K
from tensorflow.keras.callbacks import ModelCheckpoint, EarlyStopping
from tensorflow.keras.models import Model
from tensorflow.keras.layers import Input, Flatten, Dense

from siamese import SiameseNetwork

import os, math, numpy as np
from PIL import Image

import pdb

batch_size = 128
num_classes = 131
epochs = 999999

# input image dimensions
img_rows, img_cols = 28, 28


def createTrainingData():
    base_dir = '../towards/data/fruits-360/Training/'
    train_test_split = 0.7
    no_of_files_in_each_class = 80

    # Read all the folders in the directory
    folder_list = os.listdir(base_dir)
    print(len(folder_list), "categories found in the dataset")

    # Declare training arrays
    cat_list = []
    x = []
    names = []
    y = []
    y_label = 0

    # Use the first no_of_files_in_each_class images per category
    for folder_name in folder_list:
        files_list = os.listdir(os.path.join(base_dir, folder_name))
        temp = []
        for file_name in files_list[:no_of_files_in_each_class]:
            temp.append(len(x))
            x.append(np.asarray(Image.open(os.path.join(base_dir, folder_name, file_name)).convert('RGB').resize((img_rows, img_cols))))
            names.append(folder_name + "/" + file_name)
            y.append(y_label)
        y_label += 1
        cat_list.append(temp)

    cat_list = np.asarray(cat_list)
    x = np.asarray(x) / 255.0
    y = np.asarray(y)
    print('X, Y shape', x.shape, y.shape, cat_list.shape)

    # Training split
    x_train, y_train, cat_train, x_val, y_val, cat_test = [], [], [], [], [], []

    train_split = math.floor(train_test_split * no_of_files_in_each_class)
    test_split = math.floor((1 - train_test_split) * no_of_files_in_each_class)

    train_count = 0
    test_count = 0
    for i in range(len(x) - 1):
        if i % no_of_files_in_each_class == 0:
            cat_train.append([])
            cat_test.append([])
            class_train_count = 1
            class_test_count = 1

        if i % math.floor(1 / train_test_split) == 0 and class_test_count < test_split:
            x_val.append(x[i])
            y_val.append(y[i])
            cat_test[-1].append(test_count)
            test_count += 1
            class_test_count += 1
        elif class_train_count < train_split:
            x_train.append(x[i])
            y_train.append(y[i])
            cat_train[-1].append(train_count)
            train_count += 1
            class_train_count += 1

    x_val = np.array(x_val)
    y_val = np.array(y_val)
    x_train = np.array(x_train)
    y_train = np.array(y_train)
    cat_train = np.array(cat_train)
    cat_test = np.array(cat_test)

    print('X&Y shape of training data :', x_train.shape, 'and',
          y_train.shape, cat_train.shape)
    print('X&Y shape of testing data :', x_val.shape, 'and',
          y_val.shape, cat_test.shape)

    return (x_train, y_train), (x_val, y_val), cat_train


# the data, split between train and test sets
# (x_train, y_train), (x_test, y_test) = mnist.load_data()
# channels = 1

(x_train, y_train), (x_test, y_test), cat_train = createTrainingData()
channels = 3

if K.image_data_format() == 'channels_first':
    x_train = x_train.reshape(x_train.shape[0], channels, img_rows, img_cols)
    x_test = x_test.reshape(x_test.shape[0], channels, img_rows, img_cols)
    input_shape = (channels, img_rows, img_cols)
else:
    x_train = x_train.reshape(x_train.shape[0], img_rows, img_cols, channels)
    x_test = x_test.reshape(x_test.shape[0], img_rows, img_cols, channels)
    input_shape = (img_rows, img_cols, channels)

x_train = x_train.astype('float32')
x_test = x_test.astype('float32')
x_train /= 255
x_test /= 255

pdb.set_trace()


def create_own_base_model(input_shape):
    model_input = Input(shape=input_shape)

    embedding = Conv2D(32, kernel_size=(10, 10), input_shape=input_shape)(model_input)
    embedding = MaxPooling2D(pool_size=(2, 2))(embedding)
    embedding = Conv2D(64, kernel_size=(7, 7))(embedding)
    embedding = MaxPooling2D(pool_size=(2, 2))(embedding)
    embedding = Conv2D(128, kernel_size=(4, 4))(embedding)
    embedding = MaxPooling2D(pool_size=(2, 2))(embedding)
    embedding = Conv2D(256, kernel_size=(4, 4))(embedding)
    embedding = MaxPooling2D(pool_size=(2, 2))(embedding)
    embedding = Flatten()(embedding)
    embedding = Dense(4096, activation='sigmoid')(embedding)
    embedding = BatchNormalization()(embedding)
    embedding = Activation(activation='relu')(embedding)

    return Model(model_input, embedding)


def create_base_model(input_shape):
    model_input = Input(shape=input_shape)

    embedding = Conv2D(32, kernel_size=(3, 3), input_shape=input_shape)(model_input)
    embedding = BatchNormalization()(embedding)
    embedding = Activation(activation='relu')(embedding)
    embedding = MaxPooling2D(pool_size=(2, 2))(embedding)
    embedding = Conv2D(64, kernel_size=(3, 3))(embedding)
    embedding = BatchNormalization()(embedding)
    embedding = Activation(activation='relu')(embedding)
    embedding = MaxPooling2D(pool_size=(2, 2))(embedding)
    embedding = Flatten()(embedding)
    embedding = Dense(128)(embedding)
    embedding = BatchNormalization()(embedding)
    embedding = Activation(activation='relu')(embedding)

    return Model(model_input, embedding)


def create_head_model(embedding_shape):
    embedding_a = Input(shape=embedding_shape[1:])
    embedding_b = Input(shape=embedding_shape[1:])

    head = Concatenate()([embedding_a, embedding_b])
    head = Dense(8)(head)
    head = BatchNormalization()(head)
    head = Activation(activation='sigmoid')(head)

    head = Dense(1)(head)
    head = BatchNormalization()(head)
    head = Activation(activation='sigmoid')(head)

    return Model([embedding_a, embedding_b], head)


def get_batch(x_train, y_train, x_test, y_test, cat_train, batch_size=64):

    temp_x = x_train
    temp_cat_list = cat_train
    start = 0
    batch_x = []

    batch_y = np.zeros(batch_size)
    batch_y[int(batch_size / 2):] = 1
    np.random.shuffle(batch_y)

    class_list = np.random.randint(start, len(cat_train), batch_size)
    batch_x.append(np.zeros((batch_size, 100, 100, 3)))
    batch_x.append(np.zeros((batch_size, 100, 100, 3)))

    for i in range(0, batch_size):
        batch_x[0][i] = temp_x[np.random.choice(temp_cat_list[class_list[i]])]
        # If train_y has 0 pick from the same class, else pick from any other class
        if batch_y[i] == 0:
            r = np.random.choice(temp_cat_list[class_list[i]])
            batch_x[1][i] = temp_x[r]
        else:
            temp_list = np.append(temp_cat_list[:class_list[i]].flatten(), temp_cat_list[class_list[i]+1:].flatten())
            batch_x[1][i] = temp_x[np.random.choice(temp_list)]

    return (batch_x, batch_y)


num_classes = 131
epochs = 2000

base_model = create_base_model(input_shape)
head_model = create_head_model(base_model.output_shape)

siamese_network = SiameseNetwork(base_model, head_model)
siamese_network.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])

siamese_checkpoint_path = "./siamese_checkpoint"

siamese_callbacks = [
    # EarlyStopping(monitor='val_accuracy', patience=10, verbose=0),
    ModelCheckpoint(siamese_checkpoint_path, monitor='val_accuracy', save_best_only=True, verbose=0)
]

# batch_size = 64
# for epoch in range(1, epochs):
#     batch_x, batch_y = get_batch(x_train, y_train, x_test, y_test, cat_train, train_size, batch_size)
#     loss = siamese_network.train_on_batch(batch_x, batch_y)
#     print('Epoch:', epoch, ', Loss:', loss)

siamese_network.fit(x_train, y_train,
                    validation_data=(x_test, y_test),
                    batch_size=45,
                    epochs=epochs,
                    callbacks=siamese_callbacks)

# try:
#     siamese_network = keras.models.load_model(siamese_checkpoint_path)
# except Exception as e:
#     print(e)
#     print("!!!!!!")
# siamese_network.load_weights(siamese_checkpoint_path)

embedding = base_model.outputs[-1]

y_train = keras.utils.to_categorical(y_train)
y_test = keras.utils.to_categorical(y_test)

# Add softmax layer to the pre-trained embedding network
embedding = Dense(num_classes)(embedding)
embedding = BatchNormalization()(embedding)
embedding = Activation(activation='sigmoid')(embedding)

model = Model(base_model.inputs[0], embedding)
model.compile(loss=keras.losses.binary_crossentropy,
              optimizer=keras.optimizers.Adam(),
              metrics=['accuracy'])

model_checkpoint_path = "./model_checkpoint"

model__callbacks = [
    # EarlyStopping(monitor='val_accuracy', patience=10, verbose=0),
    ModelCheckpoint(model_checkpoint_path, monitor='val_accuracy', save_best_only=True, verbose=0)
]

# for e in range(1, epochs):
#     batch_x, batch_y = get_batch(x_train, y_train, x_test, y_test, cat_train, train_size, batch_size)
#     loss = model.train_on_batch(batch_x, batch_y)
#     print('Epoch:', epoch, ', Loss:', loss)

model.fit(x_train, y_train,
          batch_size=128,
          epochs=epochs,
          callbacks=model__callbacks,
          validation_data=(x_test, y_test))
# try:
#     model = keras.models.load_model(model_checkpoint_path)
# except Exception as e:
#     print(e)
#     print("!!!!!!")

# model.load_weights(model_checkpoint_path)

score = model.evaluate(x_test, y_test, verbose=0)
print('Test loss:', score[0])
print('Test accuracy:', score[1])
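For reference, a minimal sketch of reloading the saved classifier checkpoint for a single prediction. The commented-out blocks in the script above hint at this; the argmax decode is an assumption, since the script never decodes its predictions.

```python
import numpy as np
import tensorflow.keras as keras

# Reload the fine-tuned classifier written by the ModelCheckpoint callback above.
clf = keras.models.load_model("./model_checkpoint")

# Predict the class of the first validation image produced by createTrainingData().
probs = clf.predict(x_test[:1])
print("predicted class index:", int(np.argmax(probs[0])))
```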
BIN  mymodel.png  Normal file
Binary file not shown. (146 KiB)
39  notes.md  Normal file
@@ -0,0 +1,39 @@
The steps taken so far, which led to a successful detection of an image:

- Train the model defined in mnist_siamese_example.py, which uses the 'siamese.py' module to
create a siamese keras model.

- In this mnist siamese example, the data collection has been updated from the mnist drawing
sample to the fruit sample. Lots of work went into setting the arrays up correctly, because the
example from Towards Data Science did not correctly separate the classes. It had originally used
91 classes for training and the rest for testing, whereas I now use images of every class for
training _and_ testing.

- The images were shrunk down to 28 x 28 so the model defined in the siamese example could be used
without adaptation.

- In this example, two trainings take place: first the siamese model is trained (and saved under
'siamese_checkpoint'), and then a new model is retrained on top of it, with some additional layers.

I'm not yet sure what these do [todo] but I'll figure it out.

- After you've successfully trained the model, it is saved to 'model_checkpoint' or 'siamese_checkpoint'.

- The following steps can be used to classify two images.
Note that this was so far only tested using images in a 'pdb' shell from the mnist_siamese_example script:

```
import numpy as np
import tensorflow.keras as keras
from PIL import Image

model = keras.models.load_model('./siamese_checkpoint')
image1 = np.asarray(Image.open('../towards/data/fruits-360/Training/Avocado/r_254_100.jpg').convert('RGB').resize((28, 28))) / 255 / 255
image2 = np.asarray(Image.open('../towards/data/fruits-360/Training/Avocado/r_250_100.jpg').convert('RGB').resize((28, 28))) / 255 / 255
# note that the double division by 255 is only because the model was trained with this double division;
# it depends on the input scaling, of course

output = model.predict([np.array([image2]), np.array([image1])])
# Note here that the cast to np.array is necessary - otherwise the input vector is malformed

print(output)
```
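An interpretation sketch for the printed output: the head model ends in a single sigmoid unit, and the pair generator in siamese.py labels same-class pairs 1.0 and different-class pairs 0.0, so the score can be thresholded into a same/different decision. The 0.5 cutoff below is an assumption, not something the code fixes:

```
# Sketch: turn the raw siamese score into a same/different decision.
score = float(output[0][0])   # sigmoid output in [0, 1]
same = score > 0.5            # assumed cutoff; tune it on validation pairs
print('similarity:', score, '-> same class' if same else '-> different class')
```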
4  requirements.txt  Normal file
@@ -0,0 +1,4 @@
keras==2.2.4
numpy==1.16.4
pytest==4.6.4
pep8==1.7.1
15  setup.py  Normal file
@@ -0,0 +1,15 @@
from setuptools import setup

setup(
    name='siamese',
    version='0.1',
    packages=[''],
    url='https://github.com/aspamers/siamese',
    license='MIT',
    author='Abram Spamers',
    author_email='aspamers@gmail.com',
    install_requires=[
        'keras', 'numpy',
    ],
    description='An easy to use Keras Siamese Neural Network implementation'
)
291  siamese.py  Normal file
@@ -0,0 +1,291 @@
"""
Siamese neural network module.
"""

import random, math
import numpy as np

from tensorflow.keras.layers import Input
from tensorflow.keras.models import Model

import pdb


class SiameseNetwork:
    """
    A simple and lightweight siamese neural network implementation.

    The SiameseNetwork class requires the base and head model to be defined via the constructor. The class exposes
    public methods that allow it to behave similarly to a regular Keras model by passing kwargs through to the
    underlying keras model object where possible. This allows Keras features like callbacks and metrics to be used.
    """
    def __init__(self, base_model, head_model):
        """
        Construct the siamese model class with the following structure.

        -------------------------------------------------------------------
        input1 -> base_model |
                             --> embedding --> head_model --> binary output
        input2 -> base_model |
        -------------------------------------------------------------------

        :param base_model: The embedding model.
            * Input shape must be equal to that of data.
        :param head_model: The discriminator model.
            * Input shape must be equal to that of embedding
            * Output shape must be equal to 1.
        """
        # Set essential parameters
        self.base_model = base_model
        self.head_model = head_model

        # Get input shape from base model
        self.input_shape = self.base_model.input_shape[1:]

        # Initialize siamese model
        self.siamese_model = None
        self.__initialize_siamese_model()

    def compile(self, *args, **kwargs):
        """
        Configures the model for training.

        Passes all arguments to the underlying Keras model compile function.
        """
        self.siamese_model.compile(*args, **kwargs)

    def train_on_batch(self, *args, **kwargs):
        return self.siamese_model.train_on_batch(args[0], args[1])

    def fit(self, *args, **kwargs):
        """
        Trains the model on data generated batch-by-batch using the siamese network generator function.

        Redirects arguments to the fit_generator function.
        """
        x_train = args[0]
        y_train = args[1]
        x_test, y_test = kwargs.pop('validation_data')
        batch_size = kwargs.pop('batch_size')

        train_generator = self.__pair_generator(x_train, y_train, batch_size)
        train_steps = math.floor(max(len(x_train) / batch_size, 1))
        test_generator = self.__pair_generator(x_test, y_test, batch_size)
        test_steps = math.floor(max(len(x_test) / batch_size, 1))

        pdb.set_trace()

        self.siamese_model.fit(train_generator,
                               steps_per_epoch=train_steps,
                               validation_data=test_generator,
                               validation_steps=test_steps, **kwargs)

    def fit_generator(self, x_train, y_train, x_test, y_test, batch_size, *args, **kwargs):
        """
        Trains the model on data generated batch-by-batch using the siamese network generator function.

        :param x_train: Training input data.
        :param y_train: Training output data.
        :param x_test: Validation input data.
        :param y_test: Validation output data.
        :param batch_size: Number of pairs to generate per batch.
        """
        train_generator = self.__pair_generator(x_train, y_train, batch_size)
        train_steps = max(len(x_train) / batch_size, 1)
        test_generator = self.__pair_generator(x_test, y_test, batch_size)
        test_steps = max(len(x_test) / batch_size, 1)
        self.siamese_model.fit_generator(train_generator,
                                         steps_per_epoch=train_steps,
                                         validation_data=test_generator,
                                         validation_steps=test_steps,
                                         *args, **kwargs)

    def load_weights(self, checkpoint_path):
        """
        Load siamese model weights. This also affects the reference to the base and head models.

        :param checkpoint_path: Path to the checkpoint file.
        """
        self.siamese_model.load_weights(checkpoint_path)

    def evaluate(self, *args, **kwargs):
        """
        Evaluate the siamese network with the same generator that is used to train it. Passes arguments through to the
        underlying Keras function so that callbacks etc. can be used.

        Redirects arguments to the evaluate_generator function.

        :return: A tuple of scores
        """
        x = args[0]
        y = args[1]
        batch_size = kwargs.pop('batch_size')

        generator = self.__pair_generator(x, y, batch_size)
        steps = len(x) / batch_size
        return self.siamese_model.evaluate_generator(generator, steps=steps, **kwargs)

    def evaluate_generator(self, x, y, batch_size, *args, **kwargs):
        """
        Evaluate the siamese network with the same generator that is used to train it. Passes arguments through to the
        underlying Keras function so that callbacks etc. can be used.

        :param x: Input data
        :param y: Class labels
        :param batch_size: Number of pairs to generate per batch.
        :return: A tuple of scores
        """
        generator = self.__pair_generator(x, y, batch_size=batch_size)
        steps = len(x) / batch_size
        return self.siamese_model.evaluate_generator(generator, steps=steps, *args, **kwargs)

    def __initialize_siamese_model(self):
        """
        Create the siamese model structure using the supplied base and head model.
        """
        input_a = Input(shape=self.input_shape)
        input_b = Input(shape=self.input_shape)

        processed_a = self.base_model(input_a)
        processed_b = self.base_model(input_b)

        head = self.head_model([processed_a, processed_b])
        self.siamese_model = Model([input_a, input_b], head)

    def __create_pairs(self, x, class_indices, batch_size, num_classes):
        """
        Create a numpy array of positive and negative pairs and their associated labels.

        :param x: Input data
        :param class_indices: A python list of lists that contains each of the indices in the input data that belong
            to each class. It is used to find and access elements in the input data that belong to a desired class.
            * Example usage:
                * element_index = class_indices[class][index]
                * element = x[element_index]
        :param batch_size: The number of pair samples to create.
        :param num_classes: number of classes in the supplied input data
        :return: A tuple of (Numpy array of pairs, Numpy array of labels)
        """
        num_pairs = batch_size / 2
        positive_pairs, positive_labels = self.__create_positive_pairs(x, class_indices, num_pairs, num_classes)
        negative_pairs, negative_labels = self.__create_negative_pairs(x, class_indices, num_pairs, num_classes)
        return np.array(positive_pairs + negative_pairs), np.array(positive_labels + negative_labels)

    def __create_positive_pairs(self, x, class_indices, num_positive_pairs, num_classes):
        """
        Create a list of positive pairs and labels. A positive pair is defined as two input samples of the same class.

        :param x: Input data
        :param class_indices: A python list of lists that contains each of the indices in the input data that belong
            to each class. It is used to find and access elements in the input data that belong to a desired class.
            * Example usage:
                * element_index = class_indices[class][index]
                * element = x[element_index]
        :param num_positive_pairs: The number of positive pair samples to create.
        :param num_classes: number of classes in the supplied input data
        :return: A tuple of (python list of positive pairs, python list of positive labels)
        """
        positive_pairs = []
        positive_labels = []

        for _ in range(int(num_positive_pairs)):
            class_1 = random.randint(0, num_classes - 1)
            num_elements = len(class_indices[class_1])

            if num_elements == 0:
                return [], []
            index_1, index_2 = self.__randint_unequal(0, num_elements - 1)

            element_index_1, element_index_2 = class_indices[class_1][index_1], class_indices[class_1][index_2]
            positive_pairs.append([x[element_index_1], x[element_index_2]])
            positive_labels.append([1.0])
        return positive_pairs, positive_labels

    def __create_negative_pairs(self, x, class_indices, num_negative_pairs, num_classes):
        """
        Create a list of negative pairs and labels. A negative pair is defined as two input samples of different class.

        :param x: Input data
        :param class_indices: A python list of lists that contains each of the indices in the input data that belong
            to each class. It is used to find and access elements in the input data that belong to a desired class.
            * Example usage:
                * element_index = class_indices[class][index]
                * element = x[element_index]
        :param num_negative_pairs: The number of negative pair samples to create.
        :param num_classes: number of classes in the supplied input data
        :return: A tuple of (python list of negative pairs, python list of negative labels)
        """
        negative_pairs = []
        negative_labels = []

        if num_classes == 0:
            return [], []

        for _ in range(int(num_negative_pairs)):
            cls_1, cls_2 = self.__randint_unequal(0, num_classes - 1)

            try:
                index_1 = random.randint(0, len(class_indices[cls_1]) - 1)
                index_2 = random.randint(0, len(class_indices[cls_2]) - 1)
            except Exception as e:
                print(e)
                pdb.set_trace()

            element_index_1, element_index_2 = class_indices[cls_1][index_1], class_indices[cls_2][index_2]
            negative_pairs.append([x[element_index_1], x[element_index_2]])
            negative_labels.append([0.0])
        return negative_pairs, negative_labels

    def __pair_generator(self, x, y, batch_size):
        """
        Creates a python generator that produces pairs from the original input data.

        :param x: Input data
        :param y: Integer class labels
        :param batch_size: The number of pair samples to create per batch.
        :return: A generator yielding ([pairs_first, pairs_second], labels) batches.
        """
        class_indices, num_classes = self.__get_class_indices(y)
        while True:
            pairs, labels = self.__create_pairs(x, class_indices, batch_size, num_classes)

            # The siamese network expects two inputs and one output. Split the pairs into a list of inputs.
            yield [pairs[:, 0], pairs[:, 1]], labels

    def __get_class_indices(self, y):
        """
        Create a python list of lists that contains each of the indices in the input data that belong
        to each class. It is used to find and access elements in the input data that belong to a desired class.

        * Example usage:
            * element_index = class_indices[class][index]
            * element = x[element_index]
        :param y: Integer class labels
        :return: Python list of lists
        """
        num_classes = np.max(y) + 1
        return [np.where(y == i)[0] for i in range(num_classes)], num_classes

    @staticmethod
    def __randint_unequal(lower, upper):
        """
        Get two random integers that are not equal.

        Note: when a class has only one sample the two integers cannot differ, so after 10 failed tries the loop
        gives up and the integers may be returned equal. This will only happen on fairly exotic datasets.
        :param lower: Lower limit inclusive of the random integer.
        :param upper: Upper limit inclusive of the random integer. Need to use -1 for random indices.
        :return: Tuple of (integer, integer)
        """

        int_1 = random.randint(lower, upper)
        int_2 = random.randint(lower, upper)

        tries = 0
        while int_1 == int_2:
            tries += 1
            if tries > 10:
                break
            int_1 = random.randint(lower, upper)
            int_2 = random.randint(lower, upper)
        return int_1, int_2
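To make the fit contract above concrete, a minimal end-to-end sketch of the calling convention (it mirrors the unit test below; the tiny shapes and layer sizes are arbitrary assumptions, and note that fit() as committed still contains a pdb.set_trace() breakpoint, so this pauses in the debugger when run):

```python
import numpy as np
from tensorflow.keras.layers import Input, Dense, Concatenate
from tensorflow.keras.models import Model

from siamese import SiameseNetwork

# Toy data: 100 three-dimensional samples spread over 5 integer classes.
x = np.random.rand(100, 3)
y = np.random.randint(5, size=100)

# Base (embedding) model: its input shape must match the data.
model_input = Input(shape=(3,))
base_model = Model(model_input, Dense(4)(model_input))

# Head (discriminator) model: two embedding inputs, one sigmoid output.
embedding_a = Input(shape=(4,))
embedding_b = Input(shape=(4,))
head = Dense(1, activation='sigmoid')(Concatenate()([embedding_a, embedding_b]))
head_model = Model([embedding_a, embedding_b], head)

network = SiameseNetwork(base_model, head_model)
network.compile(loss='binary_crossentropy', optimizer='adam')

# fit() pops 'validation_data' and 'batch_size' before delegating,
# so both keyword arguments are required.
network.fit(x, y, validation_data=(x, y), batch_size=20, epochs=1)
```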
0  tests/__init__.py  Normal file
80  tests/test_siamese.py  Normal file
@@ -0,0 +1,80 @@

"""
Tests for the siamese neural network module
"""

import numpy as np
import keras
from keras import Model, Input
from keras.layers import Concatenate, Dense, BatchNormalization, Activation

from siamese import SiameseNetwork


def test_siamese():
    """
    Test that all components of the siamese network work correctly by executing a
    training run against generated data.
    """

    num_classes = 5
    input_shape = (3,)
    epochs = 1000

    # Generate some data
    x_train = np.random.rand(100, 3)
    y_train = np.random.randint(num_classes, size=100)

    x_test = np.random.rand(30, 3)
    y_test = np.random.randint(num_classes, size=30)

    # Define base and head model
    def create_base_model(input_shape):
        model_input = Input(shape=input_shape)

        embedding = Dense(4)(model_input)
        embedding = BatchNormalization()(embedding)
        embedding = Activation(activation='relu')(embedding)

        return Model(model_input, embedding)

    def create_head_model(embedding_shape):
        embedding_a = Input(shape=embedding_shape)
        embedding_b = Input(shape=embedding_shape)

        head = Concatenate()([embedding_a, embedding_b])
        head = Dense(4)(head)
        head = BatchNormalization()(head)
        head = Activation(activation='sigmoid')(head)

        head = Dense(1)(head)
        head = BatchNormalization()(head)
        head = Activation(activation='sigmoid')(head)

        return Model([embedding_a, embedding_b], head)

    # Create siamese neural network
    base_model = create_base_model(input_shape)
    head_model = create_head_model(base_model.output_shape)
    siamese_network = SiameseNetwork(base_model, head_model)

    # Prepare siamese network for training
    siamese_network.compile(loss='binary_crossentropy',
                            optimizer=keras.optimizers.adam())

    # Evaluate network before training to establish a baseline
    score_before = siamese_network.evaluate_generator(
        x_train, y_train, batch_size=64
    )

    # Train network
    siamese_network.fit(x_train, y_train,
                        validation_data=(x_test, y_test),
                        batch_size=64,
                        epochs=epochs)

    # Evaluate network
    score_after = siamese_network.evaluate(x_train, y_train, batch_size=64)

    # Ensure that the training loss score improved as a result of the training
    assert(score_before > score_after)