Examples

This repository contains runnable example scripts in examples/:

`example_act.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Example the usage of activation functions in qkeras."""

import numpy as np

from qkeras import (
    bernoulli,
    binary,
    hard_sigmoid,
    hard_tanh,
    quantized_bits,
    quantized_po2,
    quantized_relu,
    quantized_relu_po2,
    quantized_tanh,
    set_internal_sigmoid,
    smooth_sigmoid,
    smooth_tanh,
    stochastic_binary,
    stochastic_ternary,
    ternary,
)


def _f16(tensor):
    """Return ``tensor`` converted to a float16 NumPy array for compact printing."""
    return tensor.numpy().astype("float16")


def _print_relu_tanh_variants(c):
    """Print a fixed set of ``quantized_relu`` / ``quantized_tanh`` outputs for ``c``.

    ``main`` calls this once per ``set_internal_sigmoid`` setting so the
    printed values can be compared between settings.

    Args:
      c: NumPy array of sample inputs passed to every quantizer.
    """
    print("qr_101 =", _f16(quantized_relu(1, 0, 1)(c)))
    print("qr_111 =", _f16(quantized_relu(1, 1, 1)(c)))
    print("qr_201 =", _f16(quantized_relu(2, 0, 1)(c)))
    print("qr_211 =", _f16(quantized_relu(2, 1, 1)(c)))
    print("qt_200 =", _f16(quantized_tanh(2, 0)(c)))
    print("qt_210 =", _f16(quantized_tanh(2, 1)(c)))
    print("qt_201 =", _f16(quantized_tanh(2, 0, 1)(c)))
    print("qt_211 =", _f16(quantized_tanh(2, 1, 1)(c)))


def main():
    """Print the outputs of the qkeras activations/quantizers on sample inputs."""
    # Check the mean value of samples from stochastic rounding for po2.
    count = 100000
    val = 42
    a = np.array([val] * count)
    b = quantized_po2(use_stochastic_rounding=True)(a)
    res = np.sum(b.numpy()) / count
    print(res, "should be close to ", val)
    b = quantized_relu_po2(use_stochastic_rounding=True)(a)
    res = np.sum(b.numpy()) / count
    print(res, "should be close to ", val)
    a = np.array([-1] * count)
    b = quantized_relu_po2(use_stochastic_rounding=True)(a)
    res = np.sum(b.numpy()) / count
    print(res, "should be all ", 0)

    # Non-stochastic rounding quantizers, evaluated on a single sample value.
    a = np.array([0.194336])
    print(" a =", a.astype("float16"))
    print("qa =", _f16(quantized_relu(6, 2)(a)))
    print("ss =", _f16(smooth_sigmoid(a)))
    print("hs =", _f16(hard_sigmoid(a)))
    print("ht =", _f16(hard_tanh(a)))
    print("st =", _f16(smooth_tanh(a)))
    c = np.array(np.arange(-1.5, 1.51, 0.3), dtype="float32")
    print(" c =", c.astype("float16"))
    print("qb_111 =", _f16(quantized_bits(1, 1, 1)(c)))
    print("qb_210 =", _f16(quantized_bits(2, 1, 0)(c)))
    print("qb_211 =", _f16(quantized_bits(2, 1, 1)(c)))
    print("qb_300 =", _f16(quantized_bits(3, 0, 0)(c)))
    print("qb_301 =", _f16(quantized_bits(3, 0, 1)(c)))

    # 1000 stacked copies of ``c`` so stochastic outputs can be averaged per column.
    c_1000 = np.array(np.array([list(c)] * 1000), dtype="float32")
    b = np.sum(bernoulli()(c_1000).numpy().astype(np.int32), axis=0) / 1000.0
    print("       hs =", _f16(hard_sigmoid(c)))
    print("    b_all =", b.astype("float16"))

    t = stochastic_ternary(alpha="auto")(c_1000).numpy()
    for i in range(10):
        print(f"stochastic_ternary({i}) =", t[i])
    print(
        "   st_all =",
        np.round(
            np.sum(t.astype("float32"), axis=0).astype("float16") / 1000.0, 2
        ).astype("float16"),
    )

    print("  ternary =", ternary(threshold=0.5)(c).numpy().astype(np.int32))
    print(" c =", c.astype("float16"))
    print(" b_10 =", _f16(binary(1)(c)))
    print("qr_10 =", _f16(quantized_relu(1, 0)(c)))
    print("qr_11 =", _f16(quantized_relu(1, 1)(c)))
    print("qr_20 =", _f16(quantized_relu(2, 0)(c)))
    print("qr_21 =", _f16(quantized_relu(2, 1)(c)))
    _print_relu_tanh_variants(c)

    set_internal_sigmoid("smooth")
    print("with smooth sigmoid")
    _print_relu_tanh_variants(c)

    set_internal_sigmoid("real")
    print("with real sigmoid")
    _print_relu_tanh_variants(c)

    set_internal_sigmoid("hard")
    print(" c =", c.astype("float16"))
    print("q2_31 =", _f16(quantized_po2(3, 1)(c)))
    print("q2_32 =", _f16(quantized_po2(3, 2)(c)))
    print("qr2_21 =", _f16(quantized_relu_po2(2, 1)(c)))
    print("qr2_22 =", _f16(quantized_relu_po2(2, 2)(c)))
    # NOTE(review): the next two labels do not follow the naming pattern of the
    # lines above given their arguments ((4, 1) and relu_po2(32, 2)) — confirm
    # whether the label or the arguments are the intended ones.
    print("qr2_44 =", _f16(quantized_relu_po2(4, 1)(c)))

    print("q2_32_2 =", _f16(quantized_relu_po2(32, 2)(c)))

    b = stochastic_binary()(c_1000).numpy().astype(np.int32)
    for i in range(5):
        print(f"sbinary({i}) =", b[i])
    print("sbinary =", np.round(np.sum(b, axis=0) / 1000.0, 2).astype("float16"))
    print(" binary =", binary()(c).numpy().astype(np.int32))
    print(" c      =", c.astype("float16"))

    # Repeat each stochastic quantizer ten times to show run-to-run variation.
    for i in range(10):
        print(
            f" s_bin({i}) =",
            binary(use_stochastic_rounding=1)(c).numpy().astype(np.int32),
        )
    for i in range(10):
        print(
            f" s_po2({i}) =",
            quantized_po2(use_stochastic_rounding=1)(c).numpy().astype(np.int32),
        )
    for i in range(10):
        print(
            f" s_relu_po2({i}) =",
            quantized_relu_po2(use_stochastic_rounding=1)(c).numpy().astype(np.int32),
        )


if __name__ == "__main__":
    main()

`example_cifar10_po2.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests qcore model with po2."""


import os

import keras.ops.numpy as knp
from keras.datasets import cifar10
from keras.layers import *
from keras.models import Model
from keras.optimizers import *
from keras.utils import to_categorical

from qkeras import *

# Training hyper-parameters used by the model.fit / model.evaluate calls below.
NB_EPOCH = 50
BATCH_SIZE = 64
VERBOSE = 1
NB_CLASSES = 10
OPTIMIZER = Adam(learning_rate=0.0001)
VALIDATION_SPLIT = 0.1

(x_train, y_train), (x_test, y_test) = cifar10.load_data()

# Convert the images to float and scale them by 1/255.
x_train = x_train.astype(float)
x_test = x_test.astype(float)

x_train /= 255.0
x_test /= 255.0

print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")

print(y_train[0:10])

# One-hot encode the labels for the categorical cross-entropy loss.
y_train = to_categorical(y_train, NB_CLASSES)
y_test = to_categorical(y_test, NB_CLASSES)

# Functional model: input activation, three QConv2D + activation + max-pool
# stages, then a QDense classifier followed by a softmax.
x = x_in = Input(x_train.shape[1:], name="input")
x = QActivation("quantized_relu_po2(4,4)", name="acti")(x)
x = QConv2D(
    128,
    (3, 3),
    strides=1,
    kernel_quantizer=quantized_po2(4, 1),
    bias_quantizer=quantized_po2(4, 4),
    bias_range=4,
    name="conv2d_0_m",
)(x)
x = QActivation("ternary()", name="act0_m")(x)
x = MaxPooling2D(2, 2, name="mp_0")(x)
x = QConv2D(
    256,
    (3, 3),
    strides=1,
    kernel_quantizer=quantized_po2(4, 1),
    bias_quantizer=quantized_po2(4, 4),
    bias_range=4,
    name="conv2d_1_m",
)(x)
x = QActivation("quantized_relu(6,2)", name="act1_m")(x)
x = MaxPooling2D(2, 2, name="mp_1")(x)
x = QConv2D(
    128,
    (3, 3),
    strides=1,
    kernel_quantizer=quantized_bits(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
    name="conv2d_2_m",
)(x)
x = QActivation("quantized_relu(4,2)", name="act2_m")(x)
x = MaxPooling2D(2, 2, name="mp_2")(x)
x = Flatten()(x)
x = QDense(
    NB_CLASSES,
    kernel_quantizer=quantized_ulaw(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
    name="dense",
)(x)
x = Activation("softmax", name="softmax")(x)

model = Model(inputs=[x_in], outputs=[x])
model.summary()

model.compile(
    loss="categorical_crossentropy", optimizer=OPTIMIZER, metrics=["accuracy"]
)

# Training only runs when the TRAIN environment variable is set to a non-zero
# integer; otherwise the script just prints the model summary and qstats.
if int(os.environ.get("TRAIN", 0)):
    # NOTE(review): with initial_epoch=1 Keras starts counting at epoch 1, so
    # NB_EPOCH - 1 epochs are actually run — confirm this is intended.
    history = model.fit(
        x_train,
        y_train,
        batch_size=BATCH_SIZE,
        epochs=NB_EPOCH,
        initial_epoch=1,
        verbose=VERBOSE,
        validation_split=VALIDATION_SPLIT,
    )

    # Collect the outputs of the quantized/activation layers so their value
    # ranges can be inspected with a single debug model.
    outputs = []
    output_names = []

    for layer in model.layers:
        if layer.__class__.__name__ in [
            "QActivation",
            "Activation",
            "QDense",
            "QConv2D",
            "QDepthwiseConv2D",
        ]:
            output_names.append(layer.name)
            outputs.append(layer.output)

    model_debug = Model(inputs=[x_in], outputs=outputs)

    outputs = model_debug.predict(x_train)

    print("{:30} {: 8.4f} {: 8.4f}".format("input", knp.min(x_train), knp.max(x_train)))

    # One report line per layer: name, output min/max, then the min/max of each
    # quantized weight tensor in parentheses.
    for n, p in zip(output_names, outputs):
        print(f"{n:30} {knp.min(p): 8.4f} {knp.max(p): 8.4f}", end="")
        layer = model.get_layer(n)
        for i, weights in enumerate(layer.get_weights()):
            weights = layer.get_quantizers()[i](weights)
            print(
                f" ({knp.min(weights): 8.4f} {knp.max(weights): 8.4f})", end=""
            )
        # Terminate the line once per layer. Doing it inside the weight loop
        # left weight-less layers without a newline and split layers with
        # several weight tensors across lines.
        print("")

    score = model.evaluate(x_test, y_test, verbose=VERBOSE)
    print("Test score:", score[0])
    print("Test accuracy:", score[1])

model.summary()

print_qstats(model)

`example_ternary.py`

# Copyright 2020 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================

import keras.ops.numpy as knp
import matplotlib
import numpy as np
from absl import app, flags

matplotlib.use("TkAgg")
import matplotlib.pyplot as plt

FLAGS = flags.FLAGS


def _stochastic_rounding(x, precision, resolution, delta):
    """Stochastically round ``x`` to one of the two edges of a band around ``delta``.

    Each element is mapped to either ``delta - precision`` or
    ``delta + precision``. The further an element lies above the lower edge,
    the more likely it is mapped to the upper edge.

    Args:
      x: Values to round; must expose ``.shape`` (the caller passes values
        already divided by its scale).
      precision: A float. Half-width of the band around ``delta``, i.e. the
        band is [delta - precision, delta + precision].
      resolution: Controls the quantization resolution; all quantities are
        multiplied by ``1 / resolution`` before being compared.
      delta: The discontinuity point (positive number) the band is centred on.

    Returns:
      A tensor whose entries are the lower or the upper band edge.
    """
    inv_resolution = 1 / resolution
    lower_edge = (delta - precision) * inv_resolution
    upper_edge = (delta + precision) * inv_resolution
    band_width = upper_edge - lower_edge

    # Distance of every (scaled) input from the lower edge of the band.
    offset = x * inv_resolution - lower_edge

    # Uniform draw over the band width decides which edge each element gets.
    draw = np.random.uniform(0, 1, size=x.shape) * band_width

    return knp.where(
        offset < draw, lower_edge / inv_resolution, upper_edge / inv_resolution
    )


def _ternary(x, sto=False):
    """Ternarize ``x`` to values in {-1, 0, +1}.

    The threshold is one third of ``max(|x|)``: entries whose magnitude is
    below it become 0, all others become their sign.

    Args:
      x: Tensor/array of values to ternarize.
      sto: When True, magnitudes are first passed through
        ``_stochastic_rounding`` (in units of ``scale``) so that values near
        the threshold are rounded up or down at random.

    Returns:
      A tensor shaped like ``x`` holding the ternarized values.
    """
    m = knp.amax(knp.abs(x), keepdims=True)
    scale = 2 * m / 3.0
    thres = scale / 2.0

    if sto:
        sign_bit = knp.sign(x)
        x = knp.abs(x)
        x = (
            sign_bit
            * scale
            * _stochastic_rounding(
                x / scale,
                precision=0.3,
                resolution=0.01,  # those two are all normalized.
                delta=thres / scale,
            )
        )
    return knp.where(knp.abs(x) < thres, knp.zeros_like(x), knp.sign(x))


def main(argv):
    """Plot the mean deterministic and stochastic ternarization of random samples.

    Args:
      argv: Command-line arguments left over after absl flag parsing; anything
        beyond the program name is rejected.

    Raises:
      app.UsageError: If extra positional arguments are given.
    """
    if len(argv) > 1:
        raise app.UsageError("Too many command-line arguments.")

    # 1000 sorted samples drawn uniformly from [-10, 10).
    samples = knp.sort(np.random.uniform(-10.0, 10.0, size=1000))

    num_trials = 500
    stochastic_sum = knp.zeros_like(samples)
    deterministic_sum = knp.zeros_like(samples)
    for _ in range(num_trials):
        plain = _ternary(samples)
        rounded = _ternary(samples, sto=True)
        deterministic_sum = deterministic_sum + plain
        stochastic_sum = stochastic_sum + rounded

    # Averaging over the trials shows the expected value of each variant.
    plt.plot(samples, deterministic_sum / num_trials)
    plt.plot(samples, stochastic_sum / num_trials)
    plt.ylabel(f"mean ({num_trials} samples)")
    plt.show()


if __name__ == "__main__":
    app.run(main)

`example_mnist.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""uses po2."""



import keras.ops.numpy as knp
from keras.datasets import mnist
from keras.layers import *
from keras.layers import Activation, Flatten, Input
from keras.models import Model
from keras.optimizers import Adam
from keras.utils import to_categorical

from qkeras import *
from qkeras.utils import model_save_quantized_weights

# np.newaxis / np.concatenate are used below; import numpy explicitly instead
# of relying on a wildcard import happening to expose ``np``.
import numpy as np

NB_EPOCH = 10
BATCH_SIZE = 64
VERBOSE = 1
NB_CLASSES = 10
# NOTE(review): Keras 3 optimizers appear to ignore the legacy `decay` argument
# (with a warning) — confirm, and use a learning-rate schedule if decay is wanted.
OPTIMIZER = Adam(learning_rate=0.0001, decay=0.000025)
VALIDATION_SPLIT = 0.1

# Set to 0 to skip training and only print the weight shapes and qstats.
train = 1

(x_train, y_train), (x_test, y_test) = mnist.load_data()

RESHAPED = 784

x_test_orig = x_test

x_train = x_train.astype(float)
x_test = x_test.astype(float)

# Add a trailing channel axis so the images match the model input.
x_train = x_train[..., np.newaxis]
x_test = x_test[..., np.newaxis]

x_train /= 256.0
x_test /= 256.0

print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")

print(y_train[0:10])

# One-hot encode the labels for the categorical cross-entropy loss.
y_train = to_categorical(y_train, NB_CLASSES)
y_test = to_categorical(y_test, NB_CLASSES)

# Functional model: three strided QConv2D + quantized_relu stages followed by
# a QDense classifier; `x_out` keeps the pre-softmax output.
x = x_in = Input(x_train.shape[1:-1] + (1,), name="input")
x = QConv2D(
    32,
    (2, 2),
    strides=(2, 2),
    kernel_quantizer=quantized_bits(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
    name="conv2d_0_m",
)(x)
x = QActivation("quantized_relu(4,0)", name="act0_m")(x)
x = QConv2D(
    64,
    (3, 3),
    strides=(2, 2),
    kernel_quantizer=quantized_bits(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
    name="conv2d_1_m",
)(x)
x = QActivation("quantized_relu(4,0)", name="act1_m")(x)
x = QConv2D(
    64,
    (2, 2),
    strides=(2, 2),
    kernel_quantizer=quantized_bits(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
    name="conv2d_2_m",
)(x)
x = QActivation("quantized_relu(4,0)", name="act2_m")(x)
x = Flatten()(x)
x = QDense(
    NB_CLASSES,
    kernel_quantizer=quantized_bits(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
    name="dense",
)(x)
x_out = x
x = Activation("softmax", name="softmax")(x)

# `model` ends in the softmax; `mo` shares the layers but stops before it.
model = Model(inputs=[x_in], outputs=[x])
mo = Model(inputs=[x_in], outputs=[x_out])
model.summary()

model.compile(
    loss="categorical_crossentropy", optimizer=OPTIMIZER, metrics=["accuracy"]
)

if train:
    # NOTE(review): with initial_epoch=1 Keras starts counting at epoch 1, so
    # NB_EPOCH - 1 epochs are actually run — confirm this is intended.
    history = model.fit(
        x_train,
        y_train,
        batch_size=BATCH_SIZE,
        epochs=NB_EPOCH,
        initial_epoch=1,
        verbose=VERBOSE,
        validation_split=VALIDATION_SPLIT,
    )

    # Collect the outputs of the quantized/activation layers so their value
    # ranges can be inspected with a single debug model.
    outputs = []
    output_names = []

    for layer in model.layers:
        if layer.__class__.__name__ in [
            "QActivation",
            "Activation",
            "QDense",
            "QConv2D",
            "QDepthwiseConv2D",
        ]:
            output_names.append(layer.name)
            outputs.append(layer.output)

    model_debug = Model(inputs=[x_in], outputs=outputs)

    outputs = model_debug.predict(x_train)

    print("{:30} {: 8.4f} {: 8.4f}".format("input", knp.min(x_train), knp.max(x_train)))

    # One report line per layer: name, output min/max, then the min/max of each
    # quantized weight tensor in parentheses.
    for n, p in zip(output_names, outputs):
        print(f"{n:30} {knp.min(p): 8.4f} {knp.max(p): 8.4f}", end="")
        layer = model.get_layer(n)
        for i, weights in enumerate(layer.get_weights()):
            weights = layer.get_quantizers()[i](weights)
            print(
                f" ({knp.min(weights): 8.4f} {knp.max(weights): 8.4f})", end=""
            )
        # Terminate the line once per layer. Doing it inside the weight loop
        # left weight-less layers without a newline and split layers with
        # several weight tensors across lines.
        print("")

    # Dump the pre-softmax predictions on the test set to a raw binary file.
    p_test = mo.predict(x_test)
    p_test.tofile("p_test.bin")

    score = model.evaluate(x_test, y_test, verbose=VERBOSE)
    print("Test score:", score[0])
    print("Test accuracy:", score[1])

    all_weights = []
    model_save_quantized_weights(model)

    # Flatten every weight tensor into one float32 vector and report its size.
    for layer in model.layers:
        for w, weights in enumerate(layer.get_weights()):
            print(layer.name, w)
            all_weights.append(weights.flatten())

    all_weights = np.concatenate(all_weights).astype("float32")
    print(all_weights.size)


for layer in model.layers:
    for w, weight in enumerate(layer.get_weights()):
        print(layer.name, w, weight.shape)

print_qstats(model)

`example_qoctave.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""QOctave example."""

import keras
from keras import initializers
from keras import ops as Kops
from keras.layers import Activation, Input, UpSampling2D
from keras.models import Model

from qkeras import *  # pylint: disable=wildcard-import


def create_model():
    """Build the example network that uses QOctaveConv2D layers.

    Returns:
      A Keras ``Model`` named "qoctave_network" taking a (256, 256, 3) input
      and ending in a softmax activation.
    """
    he_init = initializers.he_normal(seed=42)

    # Settings shared by every QOctaveConv2D layer in the network.
    octave_kwargs = dict(
        kernel_initializer=he_init,
        bias_initializer="zeros",
        bias_quantizer="quantized_bits(4,1)",
        depthwise_quantizer="quantized_bits(4,1)",
        depthwise_activation="quantized_bits(6,2,1)",
        pointwise_quantizer="quantized_bits(4,1)",
        acc_quantizer="quantized_bits(16,7,1)",
        activation="quantized_relu(6,2)",
        use_separable=True,
    )

    # (filters, alpha, strides, padding, name) of each octave layer, in order.
    octave_specs = (
        # Block 1
        (32, 0.5, (2, 2), "valid", "block1_conv1"),
        # Block 2
        (64, 0.4, (2, 2), "same", "block2_conv1"),
        # Block 3
        (64, 0.4, (2, 2), "same", "block3_conv1"),
        (32, 0.4, (1, 1), "same", "block3_conv2"),
        (32, 0.3, (1, 1), "same", "block3_conv3"),
        (32, 0.0, (2, 2), "same", "block3_conv_down"),
    )

    x_in = Input(shape=(256, 256, 3))

    # The first layer receives only the input (no low branch yet); every later
    # layer consumes the (high, low) pair produced by the previous one.
    high, low = x_in, None
    for filters, alpha, strides, padding, name in octave_specs:
        high, low = QOctaveConv2D(
            filters,
            (3, 3),
            alpha=alpha,
            strides=strides,
            padding=padding,
            name=name,
            **octave_kwargs,
        )([high, low])

    # Upsample
    upsampled = UpSampling2D(size=(2, 2), data_format="channels_last")(high)

    logits = QConv2D(
        2,
        (2, 2),
        strides=(1, 1),
        kernel_initializer=he_init,
        bias_initializer="ones",
        kernel_quantizer=quantized_bits(4, 0, 1),
        bias_quantizer=quantized_bits(4, 0, 1),
        padding="same",
        name="conv_up",
    )(upsampled)

    output = Activation("softmax", name="softmax")(logits)

    return Model(x_in, output, name="qoctave_network")


@keras.saving.register_keras_serializable()
def customLoss(y_true, y_pred):
    """Weighted log loss with squared-probability modulation.

    Positive targets contribute ``1.5 * y_true * log(y_pred) * (1 - y_pred)**2``
    and negative targets ``0.5 * (1 - y_true) * log(1 - y_pred) * y_pred**2``;
    1e-9 is added inside each log to avoid ``log(0)``.

    Args:
      y_true: Target tensor.
      y_pred: Prediction tensor, combined element-wise with ``y_true``.

    Returns:
      The negated sum, over the remaining axes, of the mean along axis 0.
    """
    # Use the ``Kops`` alias throughout instead of mixing it with ``keras.ops``.
    log1 = 1.5 * y_true * Kops.log(y_pred + 1e-9) * Kops.power(1 - y_pred, 2)
    log0 = 0.5 * (1 - y_true) * Kops.log((1 - y_pred) + 1e-9) * Kops.power(y_pred, 2)
    return -Kops.sum(Kops.mean(log0 + log1, axis=0))


if __name__ == "__main__":
    model = create_model()
    model.compile(optimizer="Adam", loss=customLoss, metrics=["acc"])
    model.summary(line_length=100)
    print_qstats(model)

`example_qdense.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests qdense model."""


import argparse

from keras.datasets import mnist
from keras.layers import Activation, Input
from keras.models import Model
from keras.optimizers import Adam
from keras.utils import to_categorical

from qkeras import QActivation, QDense, print_qstats, quantized_bits, ternary

OPTIMIZER = Adam()
NB_EPOCH = 1
BATCH_SIZE = 32
VERBOSE = 1
NB_CLASSES = 10
N_HIDDEN = 100
VALIDATION_SPLIT = 0.1
RESHAPED = 784


def QDenseModel(weights_f, load_weights=False):
    """Build, compile and return the two-layer quantized dense model.

    Args:
      weights_f: Weight file location; only read when ``load_weights`` is True.
      load_weights: When True and ``weights_f`` is set, load the weights from
        ``weights_f`` after compiling.

    Returns:
      The compiled Keras model.
    """
    inputs = Input((RESHAPED,), name="input")

    hidden = QActivation("quantized_relu(4)", name="act_i")(inputs)
    hidden = QDense(
        N_HIDDEN,
        kernel_quantizer=ternary(),
        bias_quantizer=quantized_bits(4, 0, 1),
        name="dense0",
    )(hidden)
    hidden = QActivation("quantized_relu(2)", name="act0")(hidden)

    logits = QDense(
        NB_CLASSES,
        kernel_quantizer=quantized_bits(4, 0, 1),
        bias_quantizer=quantized_bits(4, 0, 1),
        name="dense2",
    )(hidden)
    probabilities = Activation("softmax", name="softmax")(logits)

    net = Model(inputs=[inputs], outputs=[probabilities])
    net.summary()
    net.compile(
        loss="categorical_crossentropy", optimizer=OPTIMIZER, metrics=["accuracy"]
    )

    # Restoring weights is optional and needs both the flag and a file name.
    if load_weights and weights_f:
        net.load_weights(weights_f)

    print_qstats(net)
    return net


def UseNetwork(weights_f, load_weights=False):
    """Train (or load) the QDense model on MNIST and print its test metrics.

    Args:
      weights_f: weight file location. When training, the trained weights are
        saved here if it is set.
      load_weights: load weights when it is True; training is skipped in that
        case.
    """
    model = QDenseModel(weights_f, load_weights)

    batch_size = BATCH_SIZE
    (x_train_, y_train_), (x_test_, y_test_) = mnist.load_data()

    # Flatten each image to RESHAPED features; -1 infers the sample count from
    # the data instead of hard-coding the dataset sizes.
    x_train_ = x_train_.reshape(-1, RESHAPED)
    x_test_ = x_test_.reshape(-1, RESHAPED)
    x_train_ = x_train_.astype(float)
    x_test_ = x_test_.astype(float)

    x_train_ /= 255
    x_test_ /= 255

    print(x_train_.shape[0], "train samples")
    print(x_test_.shape[0], "test samples")

    # One-hot encode the labels for the categorical cross-entropy loss.
    y_train_ = to_categorical(y_train_, NB_CLASSES)
    y_test_ = to_categorical(y_test_, NB_CLASSES)

    if not load_weights:
        model.fit(
            x_train_,
            y_train_,
            batch_size=batch_size,
            epochs=NB_EPOCH,
            verbose=VERBOSE,
            validation_split=VALIDATION_SPLIT,
        )

        if weights_f:
            model.save_weights(weights_f)

    score = model.evaluate(x_test_, y_test_, verbose=VERBOSE)
    print_qstats(model)
    print("Test score:", score[0])
    print("Test accuracy:", score[1])


def ParserArgs():
    """Parse the command-line options of the qdense example.

    Returns:
      The ``argparse.Namespace`` with ``load_weight`` (string, default "0")
      and ``weight_file`` (default None).
    """
    cli = argparse.ArgumentParser()
    cli.add_argument(
        "-l",
        "--load_weight",
        default="0",
        help="""load weights directly from file.
                            0 is to disable and train the network.""",
    )
    cli.add_argument("-w", "--weight_file", default=None)
    return cli.parse_args()


if __name__ == "__main__":
    args = ParserArgs()
    lw = False if args.load_weight == "0" else True
    UseNetwork(args.weight_file, load_weights=lw)

`example_keras_to_qkeras.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests automatic conversion of keras model to qkeras."""


from keras.datasets import mnist
from keras.layers import *
from keras.models import Model

from qkeras.estimate import print_qstats
from qkeras.utils import model_quantize, quantized_model_dump

# Plain (float) Keras model with two image inputs that are concatenated and
# fed through three Conv2D + relu + max-pool stages and a Dense classifier.
x0 = x_in0 = Input((28, 28, 1), name="input0")
x1 = x_in1 = Input((28, 28, 1), name="input1")
x = Concatenate(name="concat")([x0, x1])
x = Conv2D(128, (3, 3), strides=1, name="conv2d_0_m")(x)
x = Activation("relu", name="act0_m")(x)
x = MaxPooling2D(2, 2, name="mp_0")(x)
x = Conv2D(256, (3, 3), strides=1, name="conv2d_1_m")(x)
x = Activation("relu", name="act1_m")(x)
x = MaxPooling2D(2, 2, name="mp_1")(x)
x = Conv2D(128, (3, 3), strides=1, name="conv2d_2_m")(x)
x = Activation("relu", name="act2_m")(x)
x = MaxPooling2D(2, 2, name="mp_2")(x)
x = Flatten()(x)
x = Dense(10, name="dense")(x)
x = Activation("softmax", name="softmax")(x)

model = Model(inputs=[x_in0, x_in1], outputs=[x])
model.summary()

# Quantization configuration passed to model_quantize. Some keys match layer
# names defined above ("conv2d_0_m", "conv2d_1_m", "act2_m"); the others look
# like qkeras layer class names acting as per-type defaults — TODO confirm
# against the model_quantize documentation.
q_dict = {
    "conv2d_0_m": {
        "kernel_quantizer": "binary()",
        "bias_quantizer": "quantized_bits(4,0,1)",
    },
    "conv2d_1_m": {
        "kernel_quantizer": "ternary()",
        "bias_quantizer": "quantized_bits(4,0,1)",
    },
    "act2_m": "quantized_relu(6,2)",
    "QActivation": {"relu": "quantized_relu(4,0)"},
    "QConv2D": {
        "kernel_quantizer": "quantized_bits(4,0,1)",
        "bias_quantizer": "quantized_bits(4,0,1)",
    },
    "QDense": {
        "kernel_quantizer": "quantized_bits(3,0,1)",
        "bias_quantizer": "quantized_bits(3,0,1)",
    },
}

# NOTE(review): the meaning of the third positional argument (4) is not visible
# here — presumably a default activation bit width; verify against qkeras.utils.
qmodel = model_quantize(model, q_dict, 4)

qmodel.summary()

print_qstats(qmodel)

(x_train, y_train), (x_test, y_test) = mnist.load_data()

# The same first ten test images are fed to both model inputs.
x_test_arr = [x_test[0:10, :], x_test[0:10, :]]

quantized_model_dump(
    qmodel,
    x_test_arr,
    layers_to_dump=["input0", "input1", "act2_m", "act1_m", "act0_m"],
)

`example_b2t.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Implements total/partial Binary to Thermometer decoder."""

import numpy as np

from qkeras import BinaryToThermometer

if __name__ == "__main__":
    # Fixed seed so the random images below are reproducible.
    np.random.seed(42)

    # Encode the integers 0..7 (value range 8) with 2 and then 4 classes,
    # each time in three variants: plain, with the 4th positional argument
    # set to 1, and additionally with two-hot encoding enabled.
    x = np.array(range(8))
    for n_classes in (2, 4):
        print(BinaryToThermometer(x, n_classes, 8))
        print(BinaryToThermometer(x, n_classes, 8, 1))
        print(BinaryToThermometer(x, n_classes, 8, 1, use_two_hot_encoding=1))

    # Image-shaped input with a single channel, value range 256, 8 classes.
    x = np.random.randint(0, 255, (100, 28, 28, 1))
    print(x[0, 0, 0:5])
    b = BinaryToThermometer(x, 8, 256, 0)
    print(x.shape, b.shape)
    print(b[0, 0, 0:5])
    b = BinaryToThermometer(x, 8, 256, 1)
    print(b[0, 0, 0:5])

    # Two-channel input: show the source pixel and the two 8-wide slices of
    # the encoded last axis.
    x = np.random.randint(0, 255, (100, 28, 28, 2))
    b = BinaryToThermometer(x, 8, 256, 0, 1)
    print(x.shape, b.shape)
    print(x[0, 0, 0, 0:2])
    for start in (0, 8):
        print(b[0, 0, 0, start : start + 8])

`example_mnist_prune.py`

`example_mnist_ae.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""uses po2."""



# numpy is imported explicitly: the script uses np.newaxis below and must not
# depend on `np` leaking out of one of the wildcard imports.
import numpy as np
from keras.datasets import mnist
from keras.layers import *
from keras.layers import Activation, Input
from keras.models import Model
from keras.optimizers import Adam
from keras.utils import to_categorical

from qkeras import *

# Training configuration.
NB_EPOCH = 10
BATCH_SIZE = 64
VERBOSE = 1
NB_CLASSES = 10
# NOTE(review): recent Keras releases may ignore the `decay` argument with a
# warning -- confirm against the installed Keras version.
OPTIMIZER = Adam(learning_rate=0.0001, decay=0.000025)
VALIDATION_SPLIT = 0.1

# Truthy value: run model.fit() and the reconstruction step further down.
train = 1

(x_train, y_train), (x_test, y_test) = mnist.load_data()

RESHAPED = 784

x_train = x_train.astype(float)
x_test = x_test.astype(float)

# Append a trailing channel axis of size 1.
x_train = x_train[..., np.newaxis]
x_test = x_test[..., np.newaxis]

# Scale the pixel values by 1/256.
x_train /= 256.0
x_test /= 256.0

print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")

print(y_train[0:10])

# One-hot encode the labels (the autoencoder itself is fitted on the images).
y_train = to_categorical(y_train, NB_CLASSES)
y_test = to_categorical(y_test, NB_CLASSES)

x_in = Input(x_train.shape[1:-1] + (1,))
x = x_in

# Encoder: three 3x3 quantized convolutions with shrinking filter counts,
# each followed by a 4-bit quantized ReLU.
for n_filters in (32, 16, 8):
    x = QConv2D(
        n_filters,
        kernel_size=(3, 3),
        kernel_quantizer=quantized_bits(4, 0, 1),
        bias_quantizer=quantized_bits(4, 0, 1),
    )(x)
    x = QActivation("quantized_relu(4,0)")(x)

# Decoder: the mirrored stack built from transposed convolutions.
for n_filters in (8, 16, 32):
    x = QConv2DTranspose(
        n_filters,
        kernel_size=(3, 3),
        kernel_quantizer=quantized_bits(4, 0, 1),
        bias_quantizer=quantized_bits(4, 0, 1),
    )(x)
    x = QActivation("quantized_relu(4,0)")(x)

# Single-channel output convolution; `x_out` keeps the pre-sigmoid tensor.
x_out = QConv2D(
    1,
    kernel_size=(3, 3),
    padding="same",
    kernel_quantizer=quantized_bits(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
)(x)
x = Activation("sigmoid")(x_out)

# `model` ends in the sigmoid, `mo` exposes the pre-sigmoid output.
model = Model(inputs=[x_in], outputs=[x])
mo = Model(inputs=[x_in], outputs=[x_out])
model.summary()

model.compile(optimizer=OPTIMIZER, loss="binary_crossentropy", metrics=["accuracy"])

if train:
    # The autoencoder is fitted to reproduce its own input (x_train -> x_train).
    fit_options = {
        "batch_size": BATCH_SIZE,
        "epochs": NB_EPOCH,
        "initial_epoch": 1,
        "verbose": VERBOSE,
        "validation_split": VALIDATION_SPLIT,
    }
    history = model.fit(x_train, x_train, **fit_options)

    # Generate reconstructions
    num_reco = 8
    samples, targets = x_test[:num_reco], y_test[:num_reco]
    reconstructions = model.predict(samples)


# Print the shape of every weight tensor, layer by layer.
for layer in model.layers:
    for position, tensor in enumerate(layer.get_weights()):
        print(layer.name, position, tensor.shape)

print_qstats(model)

`example_mnist_bn.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests mnist batchnormalization used as learned scale factor."""

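# To run: python example_mnist_bn.py
# NOTE: the historical invocation
#   THRESHOLD=0.05 WITH_BN=1 EPOCHS=5 TRAIN=1 python example_mnist_bn.py
# sets environment variables, but this script does not read the environment.
# THRESHOLD, WITH_BN, NB_EPOCH and TRAIN are module-level constants defined
# below; edit them there to change the run.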



import keras.backend as K
import keras.ops.numpy as knp
from keras import callbacks
from keras.datasets import mnist
from keras.layers import *
from keras.models import Model
from keras.optimizers import *
from keras.utils import to_categorical
from six.moves import zip

from qkeras import *

# Run configuration for this example.
TRAIN = 1  # truthy: run model.fit(), the per-layer statistics and evaluation
NB_EPOCH = 2  # passed to model.fit() as `epochs`
BATCH_SIZE = 64
VERBOSE = 1
NB_CLASSES = 10  # width of the one-hot labels and of the final dense layer
OPTIMIZER = Adam(learning_rate=0.0001)
VALIDATION_SPLIT = 0.1
WITH_BN = 1  # truthy: insert QBatchNormalization and drop the conv biases
THRESHOLD = 0.1  # not referenced in the visible part of this script


class LearningRateAdjuster(callbacks.Callback):
    """Halve the optimizer learning rate when a batch-norm weight grows large.

    After every epoch the callback scans all ``BatchNormalization`` /
    ``QBatchNormalization`` layers, takes the maximum of each layer's last
    weight array and, if the overall maximum exceeds 32, halves the
    optimizer's learning rate.

    Attributes:
        learning_rate_factor: cumulative factor applied so far; starts at 1.0
            and is halved on every adjustment.
    """

    def __init__(self):
        # Let the Keras base class initialise its own state first.
        super().__init__()
        self.learning_rate_factor = 1.0

    def on_epoch_end(self, epochs, logs=None):
        """Inspect batch-norm weights and halve the learning rate if needed.

        Args:
            epochs: index of the epoch that just finished (unused).
            logs: metric dictionary supplied by Keras (unused).
        """
        # Local import: the surrounding script binds only `K` and `knp`, not
        # the `keras.ops` namespace itself.
        from keras import ops

        max_variance = -1

        for layer in self.model.layers:
            if layer.__class__.__name__ in (
                "BatchNormalization",
                "QBatchNormalization",
            ):
                # NOTE(review): the last weight array is presumably the
                # moving variance -- confirm against the layer's weight order.
                variance = float(knp.max(layer.get_weights()[-1]))
                max_variance = max(variance, max_variance)

        # NOTE(review): learning_rate_factor only ever shrinks from 1.0, so
        # the `< 100` guard can never fail; kept as-is pending a decision on
        # the intended limit.
        if max_variance > 32 and self.learning_rate_factor < 100:
            optimizer = self.model.optimizer
            # Read and write the rate through the optimizer property; the
            # legacy K.get_value / K.update / K.eval helpers are not part of
            # the Keras 3 `keras.backend` namespace.
            learning_rate = float(ops.convert_to_numpy(optimizer.learning_rate))
            self.learning_rate_factor /= 2.0
            print(
                f"***** max_variance is {max_variance} / lr is {learning_rate} *****"
            )
            optimizer.learning_rate = learning_rate / 2.0


# Callback instance; it is not passed to model.fit() further down.
lra = LearningRateAdjuster()

train_split, test_split = mnist.load_data()
x_train, y_train = train_split
x_test, y_test = test_split

# Add a trailing channel axis, convert to float and scale by 1/256.
x_train = x_train.reshape(*x_train.shape, 1).astype(float)
x_test = x_test.reshape(*x_test.shape, 1).astype(float)

x_train = x_train / 256.0
x_test = x_test / 256.0

print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")

print(y_train[:10])

# One-hot encode the labels.
y_train = to_categorical(y_train, NB_CLASSES)
y_test = to_categorical(y_test, NB_CLASSES)

x_in = Input(x_train.shape[1:], name="input")
x = x_in
# x = QActivation("quantized_relu_po2(4,1)", name="acti")(x)

# One row per convolution stage:
# (conv name, bn name, activation name, pooling name, filters,
#  third positional argument of the bias quantized_bits).
conv_stages = (
    ("conv2d_0_m", "bn0", "act0_m", "mp_0", 128, 0),
    ("conv2d_1_m", "bn1", "act1_m", "mp_1", 256, 1),
    ("conv2d_2_m", "bn2", "act2_m", "mp_2", 128, 1),
)

for conv_name, bn_name, act_name, pool_name, n_filters, bias_flag in conv_stages:
    # Ternary-kernel convolution; the bias (and its quantizer) is only used
    # when batch normalization is switched off.
    x = QConv2D(
        n_filters,
        (3, 3),
        strides=1,
        kernel_quantizer=ternary(),
        bias_quantizer=None if WITH_BN else quantized_bits(4, 2, bias_flag),
        bias_range=None if WITH_BN else 4,
        use_bias=not WITH_BN,
        name=conv_name,
    )(x)
    if WITH_BN:
        x = QBatchNormalization(
            gamma_quantizer=quantized_relu_po2(4, 8),
            variance_quantizer=quantized_relu_po2(6),
            beta_quantizer=quantized_po2(4, 4),
            gamma_range=8,
            beta_range=4,
            name=bn_name,
        )(x)
    x = QActivation("quantized_relu(3,1)", name=act_name)(x)
    x = MaxPooling2D(2, 2, name=pool_name)(x)

# Classifier head.
x = Flatten()(x)
x = QDense(
    NB_CLASSES,
    kernel_quantizer=quantized_ulaw(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
    name="dense",
)(x)
x = Activation("softmax", name="softmax")(x)

model = Model(inputs=[x_in], outputs=[x])
model.summary()

model.compile(
    optimizer=OPTIMIZER, loss="categorical_crossentropy", metrics=["accuracy"]
)


if TRAIN:
    # NOTE(review): with initial_epoch=1 Keras starts counting at epoch 1, so
    # NB_EPOCH - 1 epochs are actually run -- confirm this is intended.
    history = model.fit(
        x_train,
        y_train,
        batch_size=BATCH_SIZE,
        epochs=NB_EPOCH,
        initial_epoch=1,
        verbose=VERBOSE,
        validation_split=VALIDATION_SPLIT,
        callbacks=[],
    )  # lra])

    # Collect the outputs of every layer whose value range is reported below.
    outputs = []
    output_names = []

    for layer in model.layers:
        if layer.__class__.__name__ in [
            "QActivation",
            "QBatchNormalization",
            "Activation",
            "QDense",
            "QConv2D",
            "QDepthwiseConv2D",
        ]:
            output_names.append(layer.name)
            outputs.append(layer.output)

    # Side model that returns all collected intermediate outputs at once.
    model_debug = Model(inputs=[x_in], outputs=outputs)

    outputs = model_debug.predict(x_train)

    print("{:30} {: 8.4f} {: 8.4f}".format("input", knp.min(x_train), knp.max(x_train)))

    # One row per layer: output min/max, then (min max) of each weight array
    # after applying the layer's quantizer for that weight.
    for n, p in zip(output_names, outputs):
        print(f"{n:30} {knp.min(p): 8.4f} {knp.max(p): 8.4f}", end="")
        layer = model.get_layer(n)
        for i, weights in enumerate(layer.get_weights()):
            # get_quantizers() is looked up inside the loop on purpose: plain
            # Activation layers have no weights, so it is never called on them.
            quantizer = layer.get_quantizers()[i]
            if quantizer:
                # Call the quantizer directly on the weight array; the legacy
                # K.eval / K.constant helpers are not part of the Keras 3
                # `keras.backend` namespace.
                weights = quantizer(weights)
            print(
                f" ({knp.min(weights): 8.4f} {knp.max(weights): 8.4f})", end=""
            )
        print("")

    score = model.evaluate(x_test, y_test, verbose=False)
    print("Test score:", score[0])
    print("Test accuracy:", score[1])

print_qstats(model)

`example_mnist_b2t.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests qcore model with BinaryToThermometer."""


import os

import keras.ops.numpy as knp
# numpy is imported explicitly: the script uses np.newaxis below and must not
# depend on `np` leaking out of one of the wildcard imports.
import numpy as np
from keras.datasets import mnist
from keras.layers import *
from keras.layers import Activation, Flatten, Input
from keras.models import Model
from keras.optimizers import Adam
from keras.utils import to_categorical

from qkeras import *

# Training configuration.
NB_EPOCH = 20
BATCH_SIZE = 32
VERBOSE = 1
NB_CLASSES = 10
OPTIMIZER = Adam(learning_rate=0.0001)
N_HIDDEN = 100
VALIDATION_SPLIT = 0.1

# BinaryToThermometer settings: number of classes (also the channel count of
# the model input) and the residue flag passed as its 4th argument.
T_CLASSES = 256
T_WITH_RESIDUE = 0

(x_train, y_train), (x_test, y_test) = mnist.load_data()

RESHAPED = 784

x_train = x_train.astype(float)
x_test = x_test.astype(float)

# Append a trailing channel axis of size 1.
x_train = x_train[..., np.newaxis]
x_test = x_test[..., np.newaxis]

# Only scale the raw pixels when a single class is used; otherwise the images
# are converted with BinaryToThermometer later on.
if T_CLASSES == 1:
    x_train /= 256.0
    x_test /= 256.0

print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")

print(y_train[0:10])

# x_train = x_train[0:1000]
# y_train = y_train[0:1000]
# x_test = x_test[0:100]
# y_test = y_test[0:100]

# One-hot encode the labels.
y_train = to_categorical(y_train, NB_CLASSES)
y_test = to_categorical(y_test, NB_CLASSES)

# we ran out of memory here, so we split x_train/x_test into smaller groups
# (the training loop further down converts and fits one chunk at a time)

# The input keeps the spatial dimensions of the images and uses T_CLASSES
# channels.
x = x_in = Input(x_train.shape[1:-1] + (T_CLASSES,), name="input")

# Number is represented as 1.bbb, where number of bits of bbb is
# log2(256/T_CLASSES) if T_WITH_RESIDUE == 1

# Boolean arithmetic: the log2 term only counts when T_WITH_RESIDUE == 1, and
# one extra bit is added whenever T_CLASSES > 1.
bits = (T_WITH_RESIDUE == 1) * int(knp.ceil(knp.log2(256 / T_CLASSES))) + (T_CLASSES > 1)

print(f"Input quantizer: quantized_relu({bits},{int(T_CLASSES > 1)})")
x = QActivation(f"quantized_relu({bits},{int(T_CLASSES > 1)})")(x)
# Stage 0: power-of-two kernel quantizer.
x = QConv2D(
    64,
    (3, 3),
    strides=1,
    padding="same",
    kernel_quantizer=quantized_po2(4, 1),
    bias_quantizer=quantized_bits(4, 2, 1),
    bias_range=4,
    name="conv2d_0_m",
)(x)
x = QActivation("quantized_relu(4,0)", name="act0_m")(x)
x = MaxPooling2D(2, 2, name="mp_0")(x)
# Stage 1: stochastic ternary kernel quantizer.
x = QConv2D(
    32,
    (3, 3),
    strides=1,
    padding="same",
    kernel_quantizer=stochastic_ternary(),
    bias_quantizer=quantized_bits(8, 5, 1),
    bias_range=32,
    name="conv2d_1_m",
)(x)
x = QActivation("quantized_relu(4,0)", name="act1_m")(x)
x = MaxPooling2D(2, 2, name="mp_1")(x)
# Stage 2: 4-bit fixed-point kernel quantizer.
x = QConv2D(
    16,
    (3, 3),
    strides=1,
    padding="same",
    kernel_quantizer=quantized_bits(4, 0, 1),
    bias_quantizer=quantized_bits(8, 5, 1),
    bias_range=32,
    name="conv2d_2_m",
)(x)
x = QActivation("quantized_relu(6,2)", name="act2_m")(x)
x = MaxPooling2D(2, 2, name="mp_2")(x)
# Classifier head.
x = Flatten()(x)
x = QDense(
    NB_CLASSES,
    kernel_quantizer=quantized_bits(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
    name="dense2",
)(x)
x = Activation("softmax", name="softmax")(x)

model = Model(inputs=[x_in], outputs=[x])
model.summary()

model.compile(
    loss="categorical_crossentropy", optimizer=OPTIMIZER, metrics=["accuracy"]
)

# Layer classes whose outputs are exposed by the debug model.
traced_layer_types = (
    "QActivation",
    "Activation",
    "QDense",
    "QConv2D",
    "QDepthwiseConv2D",
)

traced_layers = [
    candidate
    for candidate in model.layers
    if candidate.__class__.__name__ in traced_layer_types
]
output_names = [traced.name for traced in traced_layers]
outputs = [traced.output for traced in traced_layers]

# Side model returning every traced intermediate output for one input batch.
model_debug = Model(inputs=[x_in], outputs=outputs)

# Training data is converted and fitted in chunks of `batch_size` samples.
batch_size = 1000 * BATCH_SIZE
# Ceiling division: the last, shorter chunk must be trained on as well. Floor
# division silently dropped every sample past the last full chunk and made
# the min() clamp in the loop below dead code.
n_batches = (x_train.shape[0] + batch_size - 1) // batch_size

if T_CLASSES > 1:
    x_test = BinaryToThermometer(x_test, T_CLASSES, 256, T_WITH_RESIDUE)

# Training only runs when the TRAIN environment variable is a non-zero integer.
if int(os.environ.get("TRAIN", 0)):
    for i in range(NB_EPOCH):
        for b in range(n_batches):
            min_b = b * batch_size
            # Clamp the upper bound for the final, partial chunk.
            max_b = min((b + 1) * batch_size, x_train.shape[0])

            if T_CLASSES > 1:
                x = BinaryToThermometer(
                    x_train[min_b:max_b], T_CLASSES, 256, T_WITH_RESIDUE
                )
            else:
                x = x_train[min_b:max_b]

            # Exactly one epoch (index i) on the current chunk.
            history = model.fit(
                x,
                y_train[min_b:max_b],
                batch_size=BATCH_SIZE,
                epochs=i + 1,
                initial_epoch=i,
                verbose=VERBOSE,
                validation_split=VALIDATION_SPLIT,
            )

    # Report value ranges on the first 100 training samples.
    if T_CLASSES > 1:
        x = BinaryToThermometer(x_train[0:100], T_CLASSES, 256, T_WITH_RESIDUE)
    else:
        x = x_train[0:100]

    outputs = model_debug.predict(x)

    print("{:30} {: 8.4f} {: 8.4f}".format("input", knp.min(x), knp.max(x)))
    # One row per traced layer: output min/max, then (min max) of each
    # quantized weight array.
    for n, p in zip(output_names, outputs):
        print(f"{n:30} {knp.min(p): 8.4f} {knp.max(p): 8.4f}", end="")
        layer = model.get_layer(n)
        for i, weights in enumerate(layer.get_weights()):
            weights = layer.get_quantizers()[i](weights)
            print(
                f" ({knp.min(weights): 8.4f} {knp.max(weights): 8.4f})", end=""
            )
        print("")

    score = model.evaluate(x_test, y_test, verbose=VERBOSE)
    print("Test score:", score[0])
    print("Test accuracy:", score[1])

print_qstats(model)

acc = analyze_accumulator_from_sample(model, x_test, mode="sampled")

print(acc)

`example_mnist_po2.py`

# Copyright 2019 Google LLC
#
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests qlayers model with po2."""


import keras.backend as K
import keras.ops.numpy as knp
# numpy is imported explicitly: the script uses np.newaxis below and must not
# depend on `np` leaking out of the wildcard import.
import numpy as np
from keras.datasets import mnist
from keras.layers import Activation, Flatten, Input
from keras.models import Model
from keras.optimizers import Adam
from keras.utils import to_categorical

from qkeras import *  # pylint: disable=wildcard-import

# Training configuration.
NB_EPOCH = 5
BATCH_SIZE = 64
VERBOSE = 1
NB_CLASSES = 10
# NOTE(review): recent Keras releases may ignore the `decay` argument with a
# warning -- confirm against the installed Keras version.
OPTIMIZER = Adam(learning_rate=0.0001, decay=0.000025)
N_HIDDEN = 100
VALIDATION_SPLIT = 0.1

QUANTIZED = 1
CONV2D = 1

(x_train, y_train), (x_test, y_test) = mnist.load_data()

RESHAPED = 784

x_train = x_train.astype(float)
x_test = x_test.astype(float)

# Append a trailing channel axis of size 1.
x_train = x_train[..., np.newaxis]
x_test = x_test[..., np.newaxis]

# Scale the pixel values by 1/256.
x_train /= 256.0
x_test /= 256.0

# Falsy by default: the model is only built, summarised and analysed.
train = False

print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")

print(y_train[0:10])

# One-hot encode the labels.
y_train = to_categorical(y_train, NB_CLASSES)
y_test = to_categorical(y_test, NB_CLASSES)

# Model definition: three strided convolutions with power-of-two quantized
# kernels and biases, followed by a 4-bit dense classifier. Unlike the
# thermometer example, the data is fed to the model as a whole here.

x = x_in = Input(x_train.shape[1:-1] + (1,), name="input")
# Quantize the input itself with a power-of-two ReLU quantizer.
x = QActivation("quantized_relu_po2(4)", name="acti")(x)
x = QConv2D(
    32,
    (2, 2),
    strides=(2, 2),
    kernel_quantizer=quantized_po2(4, 1),
    bias_quantizer=quantized_po2(4, 1),
    name="conv2d_0_m",
)(x)
x = QActivation("quantized_relu_po2(4,4)", name="act0_m")(x)
x = QConv2D(
    64,
    (3, 3),
    strides=(2, 2),
    kernel_quantizer=quantized_po2(4, 1),
    bias_quantizer=quantized_po2(4, 1),
    name="conv2d_1_m",
)(x)
# Same activation quantizer as above, with stochastic rounding enabled.
x = QActivation("quantized_relu_po2(4,4,use_stochastic_rounding=True)", name="act1_m")(
    x
)
# Kernel quantizer with stochastic rounding enabled.
x = QConv2D(
    64,
    (2, 2),
    strides=(2, 2),
    kernel_quantizer=quantized_po2(4, 1, use_stochastic_rounding=True),
    bias_quantizer=quantized_po2(4, 1),
    name="conv2d_2_m",
)(x)
x = QActivation("quantized_relu(4,1)", name="act2_m")(x)
# Classifier head.
x = Flatten()(x)
x = QDense(
    NB_CLASSES,
    kernel_quantizer=quantized_bits(4, 0, 1),
    bias_quantizer=quantized_bits(4, 0, 1),
    name="dense",
)(x)
x = Activation("softmax", name="softmax")(x)

model = Model(inputs=[x_in], outputs=[x])
model.summary()

model.compile(
    loss="categorical_crossentropy", optimizer=OPTIMIZER, metrics=["accuracy"]
)

if train:
    # NOTE(review): with initial_epoch=1 Keras starts counting at epoch 1, so
    # NB_EPOCH - 1 epochs are actually run -- confirm this is intended.
    history = model.fit(
        x_train,
        y_train,
        batch_size=BATCH_SIZE,
        epochs=NB_EPOCH,
        initial_epoch=1,
        verbose=VERBOSE,
        validation_split=VALIDATION_SPLIT,
    )

    # Collect the outputs of every layer whose value range is reported below.
    outputs = []
    output_names = []

    for layer in model.layers:
        if layer.__class__.__name__ in [
            "QActivation",
            "Activation",
            "QDense",
            "QConv2D",
            "QDepthwiseConv2D",
        ]:
            output_names.append(layer.name)
            outputs.append(layer.output)

    # Side model that returns all collected intermediate outputs at once.
    model_debug = Model(inputs=[x_in], outputs=outputs)

    outputs = model_debug.predict(x_train)

    print("{:30} {: 8.4f} {: 8.4f}".format("input", knp.min(x_train), knp.max(x_train)))

    # One row per layer: output min/max, then (min max) of each quantized
    # weight array.
    for n, p in zip(output_names, outputs):
        print(f"{n:30} {knp.min(p): 8.4f} {knp.max(p): 8.4f}", end="")
        layer = model.get_layer(n)
        for i, weights in enumerate(layer.get_weights()):
            # Call the quantizer directly on the weight array; the legacy
            # K.eval / K.constant helpers are not part of the Keras 3
            # `keras.backend` namespace.
            weights = layer.get_quantizers()[i](weights)
            print(
                f" ({knp.min(weights): 8.4f} {knp.max(weights): 8.4f})", end=""
            )
        # Terminate the row once per layer. Inside the weight loop it left
        # rows of weightless layers unterminated and broke the line after
        # every single weight.
        print("")

    score = model.evaluate(x_test, y_test, verbose=VERBOSE)
    print("Test score:", score[0])
    print("Test accuracy:", score[1])

model.summary()

print_qstats(model)

Examples

example_act.py

example_cifar10_po2.py

example_ternary.py

example_mnist.py

example_qoctave.py

example_qdense.py

example_keras_to_qkeras.py

example_b2t.py

example_mnist_prune.py

example_mnist_ae.py

example_mnist_bn.py

example_mnist_b2t.py

example_mnist_po2.py

`example_act.py`

`example_cifar10_po2.py`

`example_ternary.py`

`example_mnist.py`

`example_qoctave.py`

`example_qdense.py`

`example_keras_to_qkeras.py`

`example_b2t.py`

`example_mnist_prune.py`

`example_mnist_ae.py`

`example_mnist_bn.py`

`example_mnist_b2t.py`

`example_mnist_po2.py`