handson-ml/12_custom_models_and_traini...

{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Chapter 12 – Custom Models and Training with TensorFlow**"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "_This notebook contains all the sample code and solutions to the exercises in chapter 12, as well as code examples from Appendix C_"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "<table align=\"left\">\n",
    "  <td>\n",
    "    <a href=\"https://colab.research.google.com/github/ageron/handson-ml3/blob/main/12_custom_models_and_training_with_tensorflow.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>\n",
    "  </td>\n",
    "  <td>\n",
    "    <a target=\"_blank\" href=\"https://kaggle.com/kernels/welcome?src=https://github.com/ageron/handson-ml3/blob/main/12_custom_models_and_training_with_tensorflow.ipynb\"><img src=\"https://kaggle.com/static/images/open-in-kaggle.svg\" /></a>\n",
    "  </td>\n",
    "</table>"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "tags": []
   },
   "source": [
    "# Setup"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "This project requires Python 3.7 or above:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "import sys\n",
    "\n",
    "assert sys.version_info >= (3, 7)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "And TensorFlow ≥ 2.8:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "from packaging import version\n",
    "import tensorflow as tf\n",
    "\n",
    "assert version.parse(tf.__version__) >= version.parse(\"2.8.0\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Using TensorFlow like NumPy"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Tensors and Operations"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Tensors"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 3), dtype=float32, numpy=\n",
       "array([[1., 2., 3.],\n",
       "       [4., 5., 6.]], dtype=float32)>"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t = tf.constant([[1., 2., 3.], [4., 5., 6.]]) # matrix\n",
    "t"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "TensorShape([2, 3])"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "tf.float32"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t.dtype"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Indexing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
       "array([[2., 3.],\n",
       "       [5., 6.]], dtype=float32)>"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t[:, 1:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 1), dtype=float32, numpy=\n",
       "array([[2.],\n",
       "       [5.]], dtype=float32)>"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t[..., 1, tf.newaxis]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Ops"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 3), dtype=float32, numpy=\n",
       "array([[11., 12., 13.],\n",
       "       [14., 15., 16.]], dtype=float32)>"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t + 10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 3), dtype=float32, numpy=\n",
       "array([[ 1.,  4.,  9.],\n",
       "       [16., 25., 36.]], dtype=float32)>"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.square(t)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
       "array([[14., 32.],\n",
       "       [32., 77.]], dtype=float32)>"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t @ tf.transpose(t)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Scalars"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=42>"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.constant(42)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Keras's low-level API"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "You may still run across code that uses Keras's low-level API:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
       "array([[11., 26.],\n",
       "       [14., 35.],\n",
       "       [19., 46.]], dtype=float32)>"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "K = tf.keras.backend\n",
    "K.square(K.transpose(t)) + 10"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "But since Keras does not support multiple backends anymore, you should instead use TF's low-level API directly:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
       "array([[11., 26.],\n",
       "       [14., 35.],\n",
       "       [19., 46.]], dtype=float32)>"
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.square(tf.transpose(t)) + 10"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Tensors and NumPy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3,), dtype=float64, numpy=array([2., 4., 5.])>"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import numpy as np\n",
    "\n",
    "a = np.array([2., 4., 5.])\n",
    "tf.constant(a)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[1., 2., 3.],\n",
       "       [4., 5., 6.]], dtype=float32)"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t.numpy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[1., 2., 3.],\n",
       "       [4., 5., 6.]], dtype=float32)"
      ]
     },
     "execution_count": 16,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.array(t)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3,), dtype=float64, numpy=array([ 4., 16., 25.])>"
      ]
     },
     "execution_count": 17,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.square(a)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[ 1.,  4.,  9.],\n",
       "       [16., 25., 36.]], dtype=float32)"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "np.square(t)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Type Conversions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cannot compute AddV2 as input #1(zero-based) was expected to be a float tensor but is a int32 tensor [Op:AddV2] name: \n"
     ]
    }
   ],
   "source": [
    "try:\n",
    "    tf.constant(2.0) + tf.constant(40)\n",
    "except tf.errors.InvalidArgumentError as ex:\n",
    "    print(ex)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "cannot compute AddV2 as input #1(zero-based) was expected to be a float tensor but is a double tensor [Op:AddV2] name: \n"
     ]
    }
   ],
   "source": [
    "try:\n",
    "    tf.constant(2.0) + tf.constant(40., dtype=tf.float64)\n",
    "except tf.errors.InvalidArgumentError as ex:\n",
    "    print(ex)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=42.0>"
      ]
     },
     "execution_count": 21,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t2 = tf.constant(40., dtype=tf.float64)\n",
    "tf.constant(2.0) + tf.cast(t2, tf.float32)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Variables"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Variable 'Variable:0' shape=(2, 3) dtype=float32, numpy=\n",
       "array([[1., 2., 3.],\n",
       "       [4., 5., 6.]], dtype=float32)>"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "v = tf.Variable([[1., 2., 3.], [4., 5., 6.]])\n",
    "v"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
       "array([[ 2.,  4.,  6.],\n",
       "       [ 8., 10., 12.]], dtype=float32)>"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "v.assign(2 * v)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
       "array([[ 2., 42.,  6.],\n",
       "       [ 8., 10., 12.]], dtype=float32)>"
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "v[0, 1].assign(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {
    "tags": []
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
       "array([[ 2., 42.,  0.],\n",
       "       [ 8., 10.,  1.]], dtype=float32)>"
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "v[:, 2].assign([0., 1.])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
       "array([[100.,  42.,   0.],\n",
       "       [  8.,  10., 200.]], dtype=float32)>"
      ]
     },
     "execution_count": 26,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "v.scatter_nd_update(\n",
    "    indices=[[0, 0], [1, 2]], updates=[100., 200.])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
       "array([[4., 5., 6.],\n",
       "       [1., 2., 3.]], dtype=float32)>"
      ]
     },
     "execution_count": 27,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows how to use scatter_update()\n",
    "sparse_delta = tf.IndexedSlices(values=[[1., 2., 3.], [4., 5., 6.]],\n",
    "                                indices=[1, 0])\n",
    "v.scatter_update(sparse_delta)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "'ResourceVariable' object does not support item assignment\n"
     ]
    }
   ],
   "source": [
    "try:\n",
    "    v[1] = [7., 8., 9.]\n",
    "except TypeError as ex:\n",
    "    print(ex)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Strings"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "The code in this section and all the following sections is in Appendix C."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=string, numpy=b'hello world'>"
      ]
     },
     "execution_count": 29,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.constant(b\"hello world\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=string, numpy=b'caf\\xc3\\xa9'>"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.constant(\"café\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([ 99,  97, 102, 233], dtype=int32)>"
      ]
     },
     "execution_count": 31,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "u = tf.constant([ord(c) for c in \"café\"])\n",
    "u"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=4>"
      ]
     },
     "execution_count": 32,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "b = tf.strings.unicode_encode(u, \"UTF-8\")\n",
    "tf.strings.length(b, unit=\"UTF8_CHAR\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([ 99,  97, 102, 233], dtype=int32)>"
      ]
     },
     "execution_count": 33,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.strings.unicode_decode(b, \"UTF-8\")"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Other Data Structures"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "The code in this section is in Appendix C."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### String arrays"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=string, numpy=b'hello world'>"
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.constant(b\"hello world\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=string, numpy=b'caf\\xc3\\xa9'>"
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.constant(\"café\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([ 99,  97, 102, 233], dtype=int32)>"
      ]
     },
     "execution_count": 36,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "u = tf.constant([ord(c) for c in \"café\"])\n",
    "u"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=string, numpy=b'caf\\xc3\\xa9'>"
      ]
     },
     "execution_count": 37,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "b = tf.strings.unicode_encode(u, \"UTF-8\")\n",
    "b"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=4>"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.strings.length(b, unit=\"UTF8_CHAR\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([ 99,  97, 102, 233], dtype=int32)>"
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.strings.unicode_decode(b, \"UTF-8\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {},
   "outputs": [],
   "source": [
    "p = tf.constant([\"Café\", \"Coffee\", \"caffè\", \"咖啡\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([4, 6, 5, 2], dtype=int32)>"
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.strings.length(p, unit=\"UTF8_CHAR\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.RaggedTensor [[67, 97, 102, 233], [67, 111, 102, 102, 101, 101],\n",
       " [99, 97, 102, 102, 232], [21654, 21857]]>"
      ]
     },
     "execution_count": 42,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "r = tf.strings.unicode_decode(p, \"UTF8\")\n",
    "r"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Ragged tensors"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(6,), dtype=int32, numpy=array([ 67, 111, 102, 102, 101, 101], dtype=int32)>"
      ]
     },
     "execution_count": 43,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "r[1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.RaggedTensor [[67, 111, 102, 102, 101, 101], [99, 97, 102, 102, 232]]>"
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "r[1:3]  # extra code – a slice of a ragged tensor is a ragged tensor"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.RaggedTensor [[67, 97, 102, 233], [67, 111, 102, 102, 101, 101],\n",
       " [99, 97, 102, 102, 232], [21654, 21857], [65, 66], [], [67]]>"
      ]
     },
     "execution_count": 45,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "r2 = tf.ragged.constant([[65, 66], [], [67]])\n",
    "tf.concat([r, r2], axis=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<tf.RaggedTensor [[67, 97, 102, 233, 68, 69, 70], [67, 111, 102, 102, 101, 101, 71],\n",
      " [99, 97, 102, 102, 232], [21654, 21857, 72, 73]]>\n"
     ]
    }
   ],
   "source": [
    "r3 = tf.ragged.constant([[68, 69, 70], [71], [], [72, 73]])\n",
    "print(tf.concat([r, r3], axis=1))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(4, 6), dtype=int32, numpy=\n",
       "array([[   67,    97,   102,   233,     0,     0],\n",
       "       [   67,   111,   102,   102,   101,   101],\n",
       "       [   99,    97,   102,   102,   232,     0],\n",
       "       [21654, 21857,     0,     0,     0,     0]], dtype=int32)>"
      ]
     },
     "execution_count": 47,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "r.to_tensor()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Sparse tensors"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {},
   "outputs": [],
   "source": [
    "s = tf.SparseTensor(indices=[[0, 1], [1, 0], [2, 3]],\n",
    "                    values=[1., 2., 3.],\n",
    "                    dense_shape=[3, 4])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3, 4), dtype=float32, numpy=\n",
       "array([[0., 1., 0., 0.],\n",
       "       [2., 0., 0., 0.],\n",
       "       [0., 0., 0., 3.]], dtype=float32)>"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.sparse.to_dense(s)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "SparseTensor(indices=tf.Tensor(\n",
       "[[0 1]\n",
       " [1 0]\n",
       " [2 3]], shape=(3, 2), dtype=int64), values=tf.Tensor([ 42.  84. 126.], shape=(3,), dtype=float32), dense_shape=tf.Tensor([3 4], shape=(2,), dtype=int64))"
      ]
     },
     "execution_count": 50,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "s * 42.0"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "unsupported operand type(s) for +: 'SparseTensor' and 'float'\n"
     ]
    }
   ],
   "source": [
    "try:\n",
    "    s + 42.0\n",
    "except TypeError as ex:\n",
    "    print(ex)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
       "array([[ 30.,  40.],\n",
       "       [ 20.,  40.],\n",
       "       [210., 240.]], dtype=float32)>"
      ]
     },
     "execution_count": 52,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows how to multiply a sparse tensor and a dense tensor\n",
    "s4 = tf.constant([[10., 20.], [30., 40.], [50., 60.], [70., 80.]])\n",
    "tf.sparse.sparse_dense_matmul(s, s4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{{function_node __wrapped__SparseToDense_device_/job:localhost/replica:0/task:0/device:CPU:0}} indices[1] = [0,1] is out of order. Many sparse ops require sorted indices.\n",
      "    Use `tf.sparse.reorder` to create a correctly ordered copy.\n",
      "\n",
      " [Op:SparseToDense] name: \n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "2023-09-05 11:03:52.814492: W tensorflow/core/framework/op_kernel.cc:1828] OP_REQUIRES failed at sparse_to_dense_op.cc:161 : INVALID_ARGUMENT: indices[1] = [0,1] is out of order. Many sparse ops require sorted indices.\n",
      "    Use `tf.sparse.reorder` to create a correctly ordered copy.\n",
      "\n",
      "\n"
     ]
    }
   ],
   "source": [
    "# extra code – when creating a sparse tensor, its indices (and the matching\n",
    "#              values) must be given in \"reading order\" (row-major), or\n",
    "#              else `to_dense()` will fail.\n",
    "s5 = tf.SparseTensor(indices=[[0, 2], [0, 1]],  # WRONG ORDER!\n",
    "                     values=[1., 2.],\n",
    "                     dense_shape=[3, 4])\n",
    "try:\n",
    "    tf.sparse.to_dense(s5)\n",
    "except tf.errors.InvalidArgumentError as ex:\n",
    "    print(ex)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 54,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3, 4), dtype=float32, numpy=\n",
       "array([[0., 2., 1., 0.],\n",
       "       [0., 0., 0., 0.],\n",
       "       [0., 0., 0., 0.]], dtype=float32)>"
      ]
     },
     "execution_count": 54,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows how to fix the sparse tensor s5 by reordering its values\n",
    "s6 = tf.sparse.reorder(s5)\n",
    "tf.sparse.to_dense(s6)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Tensor Arrays"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "metadata": {},
   "outputs": [],
   "source": [
    "array = tf.TensorArray(dtype=tf.float32, size=3)\n",
    "array = array.write(0, tf.constant([1., 2.]))\n",
    "array = array.write(1, tf.constant([3., 10.]))\n",
    "array = array.write(2, tf.constant([5., 7.]))\n",
    "tensor1 = array.read(1)  # returns (and zeros out!) tf.constant([3., 10.])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
       "array([[1., 2.],\n",
       "       [0., 0.],\n",
       "       [5., 7.]], dtype=float32)>"
      ]
     },
     "execution_count": 56,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "array.stack()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 57,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
       "array([[ 1.,  2.],\n",
       "       [ 3., 10.],\n",
       "       [ 5.,  7.]], dtype=float32)>"
      ]
     },
     "execution_count": 57,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows how to disable clear_after_read\n",
    "array2 = tf.TensorArray(dtype=tf.float32, size=3, clear_after_read=False)\n",
    "array2 = array2.write(0, tf.constant([1., 2.]))\n",
    "array2 = array2.write(1, tf.constant([3., 10.]))\n",
    "array2 = array2.write(2, tf.constant([5., 7.]))\n",
    "tensor2 = array2.read(1)  # returns tf.constant([3., 10.])\n",
    "array2.stack()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 58,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
       "array([[1., 2.],\n",
       "       [0., 0.],\n",
       "       [5., 7.]], dtype=float32)>"
      ]
     },
     "execution_count": 58,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows how to create and use a tensor array with a dynamic size\n",
    "array3 = tf.TensorArray(dtype=tf.float32, size=0, dynamic_size=True)\n",
    "array3 = array3.write(0, tf.constant([1., 2.]))\n",
    "array3 = array3.write(1, tf.constant([3., 10.]))\n",
    "array3 = array3.write(2, tf.constant([5., 7.]))\n",
    "tensor3 = array3.read(1)\n",
    "array3.stack()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Sets"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 59,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "SparseTensor(indices=tf.Tensor(\n",
       "[[0 0]\n",
       " [0 1]\n",
       " [0 2]\n",
       " [0 3]\n",
       " [0 4]], shape=(5, 2), dtype=int64), values=tf.Tensor([ 1  5  6  9 11], shape=(5,), dtype=int32), dense_shape=tf.Tensor([1 5], shape=(2,), dtype=int64))"
      ]
     },
     "execution_count": 59,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "a = tf.constant([[1, 5, 9]])\n",
    "b = tf.constant([[5, 6, 9, 11]])\n",
    "u = tf.sets.union(a, b)\n",
    "u"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 60,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(1, 5), dtype=int32, numpy=array([[ 1,  5,  6,  9, 11]], dtype=int32)>"
      ]
     },
     "execution_count": 60,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.sparse.to_dense(u)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 5), dtype=int32, numpy=\n",
       "array([[ 1,  5,  6,  9, 11],\n",
       "       [ 0, 10, 13,  0,  0]], dtype=int32)>"
      ]
     },
     "execution_count": 61,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "a = tf.constant([[1, 5, 9], [10, 0, 0]])\n",
    "b = tf.constant([[5, 6, 9, 11], [13, 0, 0, 0]])\n",
    "u = tf.sets.union(a, b)\n",
    "tf.sparse.to_dense(u)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 5), dtype=int32, numpy=\n",
       "array([[ 1,  5,  6,  9, 11],\n",
       "       [-1, 10, 13, -1, -1]], dtype=int32)>"
      ]
     },
     "execution_count": 62,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows how to use a different default value: -1 in this case\n",
    "a = tf.constant([[1, 5, 9], [10, -1, -1]])\n",
    "b = tf.constant([[5, 6, 9, 11], [13, -1, -1, -1]])\n",
    "u = tf.sets.union(a, b)\n",
    "tf.sparse.to_dense(u, default_value=-1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 63,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 3), dtype=int32, numpy=\n",
       "array([[2, 3, 7],\n",
       "       [7, 0, 0]], dtype=int32)>"
      ]
     },
     "execution_count": 63,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows how to use `tf.sets.difference()`\n",
    "set1 = tf.constant([[2, 3, 5, 7], [7, 9, 0, 0]])\n",
    "set2 = tf.constant([[4, 5, 6], [9, 10, 0]])\n",
    "tf.sparse.to_dense(tf.sets.difference(set1, set2))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 64,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(2, 2), dtype=int32, numpy=\n",
       "array([[5, 0],\n",
       "       [0, 9]], dtype=int32)>"
      ]
     },
     "execution_count": 64,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows how to use `tf.sets.intersection()`\n",
    "tf.sparse.to_dense(tf.sets.intersection(set1, set2))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 65,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(1,), dtype=bool, numpy=array([ True])>"
      ]
     },
     "execution_count": 65,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – check whether set1[0] contains 5\n",
    "tf.sets.size(tf.sets.intersection(set1[:1], tf.constant([[5, 0, 0, 0]]))) > 0"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Queues"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 66,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=2>"
      ]
     },
     "execution_count": 66,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "q = tf.queue.FIFOQueue(3, [tf.int32, tf.string], shapes=[(), ()])\n",
    "q.enqueue([10, b\"windy\"])\n",
    "q.enqueue([15, b\"sunny\"])\n",
    "q.size()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 67,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(), dtype=int32, numpy=10>,\n",
       " <tf.Tensor: shape=(), dtype=string, numpy=b'windy'>]"
      ]
     },
     "execution_count": 67,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "q.dequeue()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 68,
   "metadata": {},
   "outputs": [],
   "source": [
    "q.enqueue_many([[13, 16], [b'cloudy', b'rainy']])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 69,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(3,), dtype=int32, numpy=array([15, 13, 16], dtype=int32)>,\n",
       " <tf.Tensor: shape=(3,), dtype=string, numpy=array([b'sunny', b'cloudy', b'rainy'], dtype=object)>]"
      ]
     },
     "execution_count": 69,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "q.dequeue_many(3)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Custom loss function"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 70,
   "metadata": {},
   "outputs": [],
   "source": [
    "def huber_fn(y_true, y_pred):\n",
    "    \"\"\"Element-wise Huber loss with the threshold fixed at 1.\n",
    "\n",
    "    With error = y_true - y_pred, returns error**2 / 2 where\n",
    "    |error| < 1 and |error| - 0.5 elsewhere.\n",
    "    \"\"\"\n",
    "    residual = y_true - y_pred\n",
    "    magnitude = tf.abs(residual)\n",
    "    quadratic_branch = tf.square(residual) / 2\n",
    "    linear_branch = magnitude - 0.5\n",
    "    return tf.where(magnitude < 1, quadratic_branch, linear_branch)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 71,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAqQAAAFkCAYAAAD2RimAAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/NK7nSAAAACXBIWXMAAA9hAAAPYQGoP6dpAAB5/UlEQVR4nO3dd1xV5R/A8c9lg4IbRQVn7hmWYu49Mi3LmaOyX+YoMzNRK83VMHPkzJWaq9w5McW9cKSZmeZWECcoMi5wfn88XRAB5V7GuRe+79eLl5zDPfd+eTzc+z3PeZ7vY9A0TUMIIYQQQgid2OkdgBBCCCGEyNkkIRVCCCGEELqShFQIIYQQQuhKElIhhBBCCKErSUiFEEIIIYSuJCEVQgghhBC6koRUCCGEEELoShJSIYQQQgihK0lIhRBCCCGEriQhFUKIVIwaNQqDwUBgYKDeoSTTqFEjDAaD3mEIIUSGkIRUCGFTLl26hMFgoFWrVqk+5uDBgxgMBnr37p11gQkhhLCYJKRCCCGEEEJXkpAKIYQQQghdSUIqhMgxSpYsScmSJVP82bPGZP74449UrlwZFxcXfHx88Pf3JyoqKsXHnjx5ki5duuDl5YWTkxMlSpRg4MCB3LlzJ8njTMMPevfuzd9//81rr71GwYIFMRgMXLp0yaLfMTY2lu+//57q1avj6upKnjx5aNy4MRs3bkz22Pj4eObOncuLL75I/vz5cXNzo2TJknTo0IHdu3cneeyqVato2LAhnp6euLi44O3tTatWrVi7dq1FcQohxOMc9A5ACCGs3XfffUdgYCCdO3fm5ZdfZtOmTXz11VccP36czZs3J0lk169fT6dOnbC3t+eVV17B29ubv/76ix9++IGtW7dy6NAh8uXLl+T5z58/T506dahcuTK9evXi7t27ODk5mR2npml07tyZ1atXU65cOfr3709ERAQrV67k5ZdfZsqUKXzwwQcJj/f39+ebb76hTJkydOvWDXd3d65fv86ePXvYsWMHDRo0AGDmzJn069cPLy8vXn31VQoUKEBwcDCHDx9m7dq1dOjQwbKGFUKI/0hCKoSwSefPn2fUqFEp/uzatWsZ+lrbt28nKCiIypUrAzBu3DjatGnD1q1bWbJkCT169ADgzp079OjRg0KFCrFv3z58fHwSnmPZsmV069aNzz//nGnTpiV5/n379vHZZ5/x5ZdfpivOJUuWsHr1aho2bMi2bdsSktoRI0bg6+vLkCFDaNeuHaVKlQJg7ty5FCtWjJMnT+Lm5pbwPJqmce/evYTtuXPn4uTkxB9//EGhQoWSvOaTvb5CCGEJSUiFEDbp33//ZfTo0VnyWj169EhIRgEcHBwYP348AQEB/PTTTwkJ6aJFiwgPD2f69OlJklGArl27MnHiRJYvX54sIS1SpAgjR45Md5wLFy4E4JtvvknSw1q8eHE++ugj/P39+fnnn5O8lpOTEw4OST8KDAYD+fPnT7LP0dERR0fHZK9ZoECBdMcthBCSkAohbFLLli3ZsmVLij87ePAgfn5+GfZa9evXT7avVq1auLq6cuLEiSSva/r3/PnzyY6Jiori9u3b3L59m4IFCybsr169ukW36J90/PhxXF1defHFF5P9rFGjRgBJ4u3UqROzZs2iSpUqdO7cmYYNG+Ln50euXLmSHNupUyeGDRtGlSpV6NKlC40aNaJevXrkzZs33TELIQRIQiqEEM/k6emZ6v7r168nbN+9exeA6dOnP/X5IiIikiSkhQsXzoAoITw8HG9v7xR/VqRIEQDCwsIS9k2dOpXSpUuzcOFCxo4dy9ixY3FxcaFTp0589913CTEOHTqUAgUKMGvWLCZNmsR3332Hg4MDbdq0YfLkyQlDAIQQwlIyy14IkWPY2dkRGxub4s8eT9SeFBoamur+PHnyJGx7eHgAcOrUKTRNS/WrRIkSSZ4no1Zc8vDw4ObNmyn+zLTfFCOo2/CffPIJ
p0+f5vr16yxdupT69euzaNEiunfvniS+Pn36EBQUxK1bt1izZg2vvfYa69evp23btsTFxWVI/EKInEsSUiFEjpEvXz5CQ0OTJaURERGcO3cu1eP27NmTbF9QUBCRkZHUqFEjYV/t2rUBOHDgQMYEbKaaNWsSGRnJ4cOHk/1s165dAEnifVzRokXp2rUrW7Zs4bnnnmP79u1ERkYme1yBAgXo0KEDK1asoEmTJpw5cybF4QlCCGEOSUiFEDlGrVq1MBqN/Pzzzwn7NE3D39+fiIiIVI9bvHgxp0+fTtiOjY1l+PDhAPTq1Sth/1tvvYW7uzsjRoxI8niTR48eJYwzzQymWPz9/TEajQn7r1+/zqRJk3BwcEjo+YyOjmbHjh1ompbkOSIiInjw4AGOjo7Y29sDsHXr1mRJvNFoTBii4Orqmmm/kxAiZ5AxpEKIHGPAgAEsWLCAPn36EBAQQKFChdizZw/379+nevXq/PHHHyke16xZM+rUqUOXLl3Inz8/mzZt4s8//6Rly5a8+eabCY8rVKgQy5Yt44033qB69eq0atWKChUqEBUVxeXLl9m1axd169ZNdTJWevXo0YPVq1ezbt06qlWrxssvv5xQh/TOnTt89913lC5dGoDIyEiaNm1K6dKlqV27Nj4+Pjx8+JDffvuNkJAQPv3004SJVp07d8bNzY169epRokQJjEYjAQEB/PXXX3Tu3DlZRQEhhDCXJKRCiByjatWqbNmyheHDh/Prr7+SO3du2rRpw7fffkvnzp1TPe7jjz+mXbt2TJkyhX///ZdChQoxbNgwPv/882TjP9u2bcvx48f59ttv2b59OwEBAeTKlYvixYvz1ltvJUlgM5rBYODXX39lypQp/PTTT0ybNg0nJyeef/55Bg8ezCuvvJLw2Fy5cvH111/z+++/s2fPHkJDQ8mXLx8VKlTg66+/TtIeEyZMYMuWLRw+fJgNGzaQK1cuypYty+zZs3n77bcz7fcRQuQcBu3J+zVCCCGEEEJkIRlDKoQQQgghdCUJqRBCCCGE0JUkpEIIIYQQQlfpSkgnTJiAwWBg0KBBT33crl278PX1xcXFhdKlSzNr1qz0vKwQQgghhMhGLE5Ijxw5wpw5c6hWrdpTH3fx4kXatGlD/fr1OX78OMOHD+eDDz5g1apVlr60EEIIIYTIRixKSB8+fEj37t358ccfyZcv31MfO2vWLHx8fJg8eTIVK1akT58+vP3220ycONGigIUQQgghRPZiUR3S/v3707ZtW5o1a8bYsWOf+tgDBw7QokWLJPtatmzJvHnzMBqNODo6JjsmOjqa6OjohO34+Hju3r1LgQIFMmzNZyGEEEIIkXE0TePBgwcULVoUOzvz+jzNTkiXL1/OsWPHOHLkSJoeHxISQuHChZPsK1y4MLGxsdy+fRsvL69kx0yYMIHRo0ebG5oQQgghhNDZ1atXKV68uFnHmJWQXr16lQ8//JBt27bh4uKS5uOe7NU01eJPrbfT39+fwYMHJ2yHhYXh4+PDP//8Q/78+c0JOccyGo3s3LmTxo0bp9gLnRq7WbPQPD3RXnstE6OzXpa2W04mbWa+iIgISpQoAcC///5Lnjx5dI7INsi5Zpmc3G6Ggwexb9eO2O3boXr1NB+Xk9ssPe7evUu5cuVwd3c3+1izEtKjR48SGhqKr69vwr64uDh2797NDz/8QHR0NPb29kmOKVKkCCEhIUn2hYaG4uDgQIECBVJ8HWdnZ5ydnZPtz58/f6rHiKSMRiNubm4UKFDAvD+mESMyLygbYHG75WDSZuZ7/II+f/785M2bV79gbIica5bJ0e3WsCH89BM0agRm3ELO0W2WASwZXmlWQtq0aVNOnTqVZN9bb71FhQoV+PTTT5MlowB+fn5s2LAhyb5t27ZRq1Yt+U+2VhcvwubN0K+f3pEIIYQQlsudG3r00DsKkQZmjTh1d3enSpUqSb5y5cpFgQIFqFKlCqBut/fs2TPhmL59+3L5
8mUGDx7MmTNnmD9/PvPmzWPIkCEZ+5uIjHPwIHz+Ody9q3ckQgghhGVmzoRRo/SOQqRRhq/UFBwczJUrVxK2S5UqxaZNmwg
      "text/plain": [
       "<Figure size 800x350 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# extra code – shows what the Huber loss looks like\n",
    "\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "plt.figure(figsize=(8, 3.5))\n",
    "z = np.linspace(-4, 4, 200)\n",
    "z_center = np.linspace(-1, 1, 200)\n",
    "plt.plot(z, huber_fn(0, z), \"b-\", linewidth=2, label=\"huber($z$)\")\n",
    "plt.plot(z, z ** 2 / 2, \"r:\", linewidth=1)\n",
    "plt.plot(z_center, z_center ** 2 / 2, \"r\", linewidth=2)\n",
    "plt.plot([-1, -1], [0, huber_fn(0., -1.)], \"k--\")\n",
    "plt.plot([1, 1], [0, huber_fn(0., 1.)], \"k--\")\n",
    "plt.gca().axhline(y=0, color='k')\n",
    "plt.gca().axvline(x=0, color='k')\n",
    "plt.text(2.1, 3.5, r\"$\\frac{1}{2}z^2$\", color=\"r\", fontsize=15)\n",
    "plt.text(3.0, 2.2, r\"$|z| - \\frac{1}{2}$\", color=\"b\", fontsize=15)\n",
    "plt.axis([-4, 4, 0, 4])\n",
    "plt.grid(True)\n",
    "plt.xlabel(\"$z$\")\n",
    "plt.legend(fontsize=14)\n",
    "plt.title(\"Huber loss\", fontsize=14)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "To test our custom loss function, let's create a basic Keras model and train it on the California housing dataset:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 72,
   "metadata": {
    "tags": []
   },
   "outputs": [],
   "source": [
    "# extra code – loads, splits and scales the California housing dataset, then\n",
    "#              creates a simple Keras model\n",
    "\n",
    "from sklearn.datasets import fetch_california_housing\n",
    "from sklearn.model_selection import train_test_split\n",
    "from sklearn.preprocessing import StandardScaler\n",
    "\n",
    "housing = fetch_california_housing()\n",
    "X_train_full, X_test, y_train_full, y_test = train_test_split(\n",
    "    housing.data, housing.target.reshape(-1, 1), random_state=42)\n",
    "X_train, X_valid, y_train, y_valid = train_test_split(\n",
    "    X_train_full, y_train_full, random_state=42)\n",
    "\n",
    "scaler = StandardScaler()\n",
    "X_train_scaled = scaler.fit_transform(X_train)\n",
    "X_valid_scaled = scaler.transform(X_valid)\n",
    "X_test_scaled = scaler.transform(X_test)\n",
    "\n",
    "input_shape = X_train.shape[1:]\n",
    "\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
    "                          input_shape=input_shape),\n",
    "    tf.keras.layers.Dense(1),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 73,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.compile(loss=huber_fn, optimizer=\"nadam\", metrics=[\"mae\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 74,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.4858 - mae: 0.8357 - val_loss: 0.3479 - val_mae: 0.6527\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.2415 - mae: 0.5419 - val_loss: 0.2630 - val_mae: 0.5473\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19a5004c0>"
      ]
     },
     "execution_count": 74,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Saving/Loading Models with Custom Objects"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 75,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss/assets\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss/assets\n"
     ]
    }
   ],
   "source": [
    "model.save(\"my_model_with_a_custom_loss\")  # extra code – saving works fine"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 76,
   "metadata": {},
   "outputs": [],
   "source": [
    "model = tf.keras.models.load_model(\"my_model_with_a_custom_loss\",\n",
    "                                   custom_objects={\"huber_fn\": huber_fn})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 77,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.2052 - mae: 0.4910 - val_loss: 0.2210 - val_mae: 0.4946\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.1888 - mae: 0.4683 - val_loss: 0.2021 - val_mae: 0.4773\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19a876dd0>"
      ]
     },
     "execution_count": 77,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "metadata": {},
   "outputs": [],
   "source": [
    "def create_huber(threshold=1.0):\n",
    "    \"\"\"Build a Huber loss function for the given threshold.\n",
    "\n",
    "    The returned function is quadratic (error**2 / 2) where\n",
    "    |error| < threshold and linear\n",
    "    (threshold * |error| - threshold**2 / 2) elsewhere.\n",
    "    \"\"\"\n",
    "    def huber_fn(y_true, y_pred):\n",
    "        # keep the inner name: the notebook passes it as the\n",
    "        # \"huber_fn\" key of custom_objects when reloading the model\n",
    "        residual = y_true - y_pred\n",
    "        magnitude = tf.abs(residual)\n",
    "        quadratic_branch = tf.square(residual) / 2\n",
    "        linear_branch = threshold * magnitude - threshold ** 2 / 2\n",
    "        return tf.where(magnitude < threshold,\n",
    "                        quadratic_branch, linear_branch)\n",
    "    return huber_fn"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 79,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.compile(loss=create_huber(2.0), optimizer=\"nadam\", metrics=[\"mae\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.2051 - mae: 0.4598 - val_loss: 0.2249 - val_mae: 0.4582\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.1982 - mae: 0.4531 - val_loss: 0.2035 - val_mae: 0.4527\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19abec4f0>"
      ]
     },
     "execution_count": 80,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 81,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss_threshold_2/assets\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss_threshold_2/assets\n"
     ]
    }
   ],
   "source": [
    "model.save(\"my_model_with_a_custom_loss_threshold_2\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 82,
   "metadata": {},
   "outputs": [],
   "source": [
    "model = tf.keras.models.load_model(\"my_model_with_a_custom_loss_threshold_2\",\n",
    "                                   custom_objects={\"huber_fn\": create_huber(2.0)})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 83,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.1935 - mae: 0.4465 - val_loss: 0.2020 - val_mae: 0.4410\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.1899 - mae: 0.4422 - val_loss: 0.1867 - val_mae: 0.4399\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19ae75c30>"
      ]
     },
     "execution_count": 83,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 84,
   "metadata": {},
   "outputs": [],
   "source": [
    "class HuberLoss(tf.keras.losses.Loss):\n",
    "    \"\"\"Huber loss with a configurable threshold.\n",
    "\n",
    "    The threshold is part of get_config(), so its value can be restored\n",
    "    when a saved model is reloaded.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, threshold=1.0, **kwargs):\n",
    "        self.threshold = threshold\n",
    "        # every other keyword argument is forwarded to the base Loss class\n",
    "        super().__init__(**kwargs)\n",
    "\n",
    "    def call(self, y_true, y_pred):\n",
    "        \"\"\"Return the element-wise Huber loss of y_true - y_pred.\"\"\"\n",
    "        residual = y_true - y_pred\n",
    "        magnitude = tf.abs(residual)\n",
    "        quadratic_branch = tf.square(residual) / 2\n",
    "        linear_branch = self.threshold * magnitude - self.threshold**2 / 2\n",
    "        return tf.where(magnitude < self.threshold,\n",
    "                        quadratic_branch, linear_branch)\n",
    "\n",
    "    def get_config(self):\n",
    "        \"\"\"Return the base config extended with the threshold.\"\"\"\n",
    "        return dict(super().get_config(), threshold=self.threshold)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 85,
   "metadata": {},
   "outputs": [],
   "source": [
    "# extra code – creates another basic Keras model\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
    "                          input_shape=input_shape),\n",
    "    tf.keras.layers.Dense(1),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 86,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.compile(loss=HuberLoss(2.), optimizer=\"nadam\", metrics=[\"mae\"])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 87,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.6492 - mae: 0.8468 - val_loss: 0.5093 - val_mae: 0.6723\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.2912 - mae: 0.5552 - val_loss: 0.3715 - val_mae: 0.5683\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19b1356c0>"
      ]
     },
     "execution_count": 87,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 88,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss_class/assets\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss_class/assets\n"
     ]
    }
   ],
   "source": [
    "model.save(\"my_model_with_a_custom_loss_class\")  # extra code – saving works"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 89,
   "metadata": {},
   "outputs": [],
   "source": [
    "model = tf.keras.models.load_model(\"my_model_with_a_custom_loss_class\",\n",
    "                                   custom_objects={\"HuberLoss\": HuberLoss})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 90,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.2416 - mae: 0.5034 - val_loss: 0.2922 - val_mae: 0.5057\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.2173 - mae: 0.4774 - val_loss: 0.2503 - val_mae: 0.4843\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19a781c60>"
      ]
     },
     "execution_count": 90,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows that loading worked fine, the model can be used normally\n",
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 91,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "2.0"
      ]
     },
     "execution_count": 91,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.loss.threshold  # extra code – the threshold was loaded correctly"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Other Custom Functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 92,
   "metadata": {},
   "outputs": [],
   "source": [
    "def my_softplus(z):\n",
    "    \"\"\"Softplus activation, log(1 + exp(z)), in a numerically stable form.\n",
    "\n",
    "    Uses the identity log(1 + exp(z)) = max(z, 0) + log(1 + exp(-|z|)):\n",
    "    the exponential's argument is never positive, so it cannot overflow\n",
    "    to inf for large z the way the direct formula does.\n",
    "    \"\"\"\n",
    "    return tf.nn.relu(z) + tf.math.log1p(tf.exp(-tf.abs(z)))\n",
    "\n",
    "def my_glorot_initializer(shape, dtype=tf.float32):\n",
    "    \"\"\"Sample weights from a normal distribution, Glorot-style.\n",
    "\n",
    "    The standard deviation is sqrt(2 / (shape[0] + shape[1])), so `shape`\n",
    "    needs at least two dimensions.\n",
    "    \"\"\"\n",
    "    stddev = tf.sqrt(2. / (shape[0] + shape[1]))\n",
    "    return tf.random.normal(shape, stddev=stddev, dtype=dtype)\n",
    "\n",
    "def my_l1_regularizer(weights):\n",
    "    \"\"\"L1 penalty: the sum of the absolute values of 0.01 * weights.\"\"\"\n",
    "    return tf.reduce_sum(tf.abs(0.01 * weights))\n",
    "\n",
    "def my_positive_weights(weights):  # return value is just tf.nn.relu(weights)\n",
    "    \"\"\"Constraint that replaces negative weights with zeros.\"\"\"\n",
    "    return tf.where(weights < 0., tf.zeros_like(weights), weights)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "metadata": {},
   "outputs": [],
   "source": [
    "layer = tf.keras.layers.Dense(1, activation=my_softplus,\n",
    "                              kernel_initializer=my_glorot_initializer,\n",
    "                              kernel_regularizer=my_l1_regularizer,\n",
    "                              kernel_constraint=my_positive_weights)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 94,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 1.4714 - mae: 0.8316 - val_loss: inf - val_mae: inf\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.8094 - mae: 0.6172 - val_loss: 2.6153 - val_mae: 0.6058\n",
      "INFO:tensorflow:Assets written to: my_model_with_many_custom_parts/assets\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_many_custom_parts/assets\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.6333 - mae: 0.5617 - val_loss: 1.1687 - val_mae: 0.5468\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.5570 - mae: 0.5303 - val_loss: 1.0440 - val_mae: 0.5250\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19b868640>"
      ]
     },
     "execution_count": 94,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – show that building, training, saving, loading, and training again\n",
    "#              works fine with a model containing many custom parts\n",
    "\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
    "                          input_shape=input_shape),\n",
    "    tf.keras.layers.Dense(1, activation=my_softplus,\n",
    "                          kernel_initializer=my_glorot_initializer,\n",
    "                          kernel_regularizer=my_l1_regularizer,\n",
    "                          kernel_constraint=my_positive_weights)\n",
    "])\n",
    "model.compile(loss=\"mse\", optimizer=\"nadam\", metrics=[\"mae\"])\n",
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))\n",
    "model.save(\"my_model_with_many_custom_parts\")\n",
    "model = tf.keras.models.load_model(\n",
    "    \"my_model_with_many_custom_parts\",\n",
    "    custom_objects={\n",
    "       \"my_l1_regularizer\": my_l1_regularizer,\n",
    "       \"my_positive_weights\": my_positive_weights,\n",
    "       \"my_glorot_initializer\": my_glorot_initializer,\n",
    "       \"my_softplus\": my_softplus,\n",
    "    }\n",
    ")\n",
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 95,
   "metadata": {},
   "outputs": [],
   "source": [
    "class MyL1Regularizer(tf.keras.regularizers.Regularizer):\n",
    "    \"\"\"L1 regularizer whose strength is set by `factor`.\"\"\"\n",
    "\n",
    "    def __init__(self, factor):\n",
    "        self.factor = factor\n",
    "\n",
    "    def __call__(self, weights):\n",
    "        \"\"\"Return the sum of the absolute values of factor * weights.\"\"\"\n",
    "        scaled_weights = self.factor * weights\n",
    "        return tf.reduce_sum(tf.abs(scaled_weights))\n",
    "\n",
    "    def get_config(self):\n",
    "        \"\"\"Return the constructor argument as a config dict.\"\"\"\n",
    "        return dict(factor=self.factor)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 96,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 1.4714 - mae: 0.8316 - val_loss: inf - val_mae: inf\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 998us/step - loss: 0.8094 - mae: 0.6172 - val_loss: 2.6153 - val_mae: 0.6058\n",
      "INFO:tensorflow:Assets written to: my_model_with_many_custom_parts/assets\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_many_custom_parts/assets\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.6333 - mae: 0.5617 - val_loss: 1.1687 - val_mae: 0.5468\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.5570 - mae: 0.5303 - val_loss: 1.0440 - val_mae: 0.5250\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19b8db610>"
      ]
     },
     "execution_count": 96,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – again, show that everything works fine, this time using our\n",
    "#              custom regularizer class\n",
    "\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
    "                          input_shape=input_shape),\n",
    "    tf.keras.layers.Dense(1, activation=my_softplus,\n",
    "                          kernel_regularizer=MyL1Regularizer(0.01),\n",
    "                          kernel_constraint=my_positive_weights,\n",
    "                          kernel_initializer=my_glorot_initializer),\n",
    "])\n",
    "model.compile(loss=\"mse\", optimizer=\"nadam\", metrics=[\"mae\"])\n",
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))\n",
    "model.save(\"my_model_with_many_custom_parts\")\n",
    "model = tf.keras.models.load_model(\n",
    "    \"my_model_with_many_custom_parts\",\n",
    "    custom_objects={\n",
    "       \"MyL1Regularizer\": MyL1Regularizer,\n",
    "       \"my_positive_weights\": my_positive_weights,\n",
    "       \"my_glorot_initializer\": my_glorot_initializer,\n",
    "       \"my_softplus\": my_softplus,\n",
    "    }\n",
    ")\n",
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Custom Metrics"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 97,
   "metadata": {},
   "outputs": [],
   "source": [
    "# extra code – once again, let's create a basic Keras model\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
    "                          input_shape=input_shape),\n",
    "    tf.keras.layers.Dense(1),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 98,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.compile(loss=\"mse\", optimizer=\"nadam\", metrics=[create_huber(2.0)])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 99,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 844us/step - loss: 1.7474 - huber_fn: 0.6846\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 796us/step - loss: 0.7843 - huber_fn: 0.3136\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19b4fcf10>"
      ]
     },
     "execution_count": 99,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – train the model with our custom metric\n",
    "model.fit(X_train_scaled, y_train, epochs=2)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Note**: if you use the same function as the loss and a metric, you may be surprised to see slightly different results. This is in part because the operations are not computed exactly in the same order, so there might be tiny floating point errors. More importantly, if you use sample weights or class weights, then the equations are a bit different:\n",
    "* the `fit()` method keeps track of the mean of all batch losses seen so far since the start of the epoch. Each batch loss is the sum of the weighted instance losses divided by the _batch size_ (not the sum of weights, so the batch loss is _not_ the weighted mean of the losses).\n",
    "* the metric since the start of the epoch is equal to the sum of the weighted instance losses divided by the sum of all weights seen so far. In other words, it is the weighted mean of all the instance losses. Not the same thing."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Streaming metrics"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 100,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=0.8>"
      ]
     },
     "execution_count": 100,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "precision = tf.keras.metrics.Precision()\n",
    "precision([0, 1, 1, 1, 0, 1, 0, 1], [1, 1, 0, 1, 0, 1, 0, 1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 101,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=0.5>"
      ]
     },
     "execution_count": 101,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "precision([0, 1, 0, 0, 1, 0, 1, 1], [1, 0, 1, 1, 0, 0, 0, 0])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 102,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=0.5>"
      ]
     },
     "execution_count": 102,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "precision.result()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 103,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Variable 'true_positives:0' shape=(1,) dtype=float32, numpy=array([4.], dtype=float32)>,\n",
       " <tf.Variable 'false_positives:0' shape=(1,) dtype=float32, numpy=array([4.], dtype=float32)>]"
      ]
     },
     "execution_count": 103,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "precision.variables"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 104,
   "metadata": {},
   "outputs": [],
   "source": [
    "precision.reset_states()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Creating a streaming metric:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 105,
   "metadata": {},
   "outputs": [],
   "source": [
    "class HuberMetric(tf.keras.metrics.Metric):\n",
    "    def __init__(self, threshold=1.0, **kwargs):\n",
    "        super().__init__(**kwargs)  # handles base args (e.g., dtype)\n",
    "        self.threshold = threshold\n",
    "        self.huber_fn = create_huber(threshold)\n",
    "        self.total = self.add_weight(\"total\", initializer=\"zeros\")\n",
    "        self.count = self.add_weight(\"count\", initializer=\"zeros\")\n",
    "\n",
    "    def update_state(self, y_true, y_pred, sample_weight=None):\n",
    "        sample_metrics = self.huber_fn(y_true, y_pred)\n",
    "        self.total.assign_add(tf.reduce_sum(sample_metrics))\n",
    "        self.count.assign_add(tf.cast(tf.size(y_true), tf.float32))\n",
    "\n",
    "    def result(self):\n",
    "        return self.total / self.count\n",
    "\n",
    "    def get_config(self):\n",
    "        base_config = super().get_config()\n",
    "        return {**base_config, \"threshold\": self.threshold}"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Extra material** – the rest of this section tests the `HuberMetric` class and shows another implementation subclassing `tf.keras.metrics.Mean`."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 106,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=14.0>"
      ]
     },
     "execution_count": 106,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "m = HuberMetric(2.)\n",
    "\n",
    "# total = 2 * |10 - 2| - 2²/2 = 14\n",
    "# count = 1\n",
    "# result = 14 / 1 = 14\n",
    "m(tf.constant([[2.]]), tf.constant([[10.]]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 107,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=7.0>"
      ]
     },
     "execution_count": 107,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# total = total + (|1 - 0|² / 2) + (2 * |9.25 - 5| - 2² / 2) = 14 + 7 = 21\n",
    "# count = count + 2 = 3\n",
    "# result = total / count = 21 / 3 = 7\n",
    "m(tf.constant([[0.], [5.]]), tf.constant([[1.], [9.25]]))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 108,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=7.0>"
      ]
     },
     "execution_count": 108,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "m.result()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 109,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Variable 'total:0' shape=() dtype=float32, numpy=21.0>,\n",
       " <tf.Variable 'count:0' shape=() dtype=float32, numpy=3.0>]"
      ]
     },
     "execution_count": 109,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "m.variables"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 110,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Variable 'total:0' shape=() dtype=float32, numpy=0.0>,\n",
       " <tf.Variable 'count:0' shape=() dtype=float32, numpy=0.0>]"
      ]
     },
     "execution_count": 110,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "m.reset_states()\n",
    "m.variables"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Let's check that the `HuberMetric` class works well:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 111,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
    "                          input_shape=input_shape),\n",
    "    tf.keras.layers.Dense(1),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 112,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.compile(loss=create_huber(2.0), optimizer=\"nadam\",\n",
    "              metrics=[HuberMetric(2.0)])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 113,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 886us/step - loss: 0.6492 - huber_metric_1: 0.6492\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 838us/step - loss: 0.2912 - huber_metric_1: 0.2912\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19c2d1300>"
      ]
     },
     "execution_count": 113,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled, y_train, epochs=2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 114,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_metric/assets\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_metric/assets\n"
     ]
    }
   ],
   "source": [
    "model.save(\"my_model_with_a_custom_metric\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 115,
   "metadata": {},
   "outputs": [],
   "source": [
    "model = tf.keras.models.load_model(\n",
    "    \"my_model_with_a_custom_metric\",\n",
    "    custom_objects={\n",
    "        \"huber_fn\": create_huber(2.0),\n",
    "        \"HuberMetric\": HuberMetric\n",
    "    }\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 116,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 916us/step - loss: 0.2416 - huber_metric_1: 0.2416\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 859us/step - loss: 0.2173 - huber_metric_1: 0.2173\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19b5f0130>"
      ]
     },
     "execution_count": 116,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled, y_train, epochs=2)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "`model.metrics` contains the model's loss followed by the model's metric(s), so the `HuberMetric` is `model.metrics[-1]`:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 117,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "2.0"
      ]
     },
     "execution_count": 117,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.metrics[-1].threshold"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Looks like it works fine! More simply, we could have created the class like this:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 118,
   "metadata": {},
   "outputs": [],
   "source": [
    "class HuberMetric(tf.keras.metrics.Mean):\n",
    "    def __init__(self, threshold=1.0, name='HuberMetric', dtype=None):\n",
    "        self.threshold = threshold\n",
    "        self.huber_fn = create_huber(threshold)\n",
    "        super().__init__(name=name, dtype=dtype)\n",
    "\n",
    "    def update_state(self, y_true, y_pred, sample_weight=None):\n",
    "        metric = self.huber_fn(y_true, y_pred)\n",
    "        super(HuberMetric, self).update_state(metric, sample_weight)\n",
    "\n",
    "    def get_config(self):\n",
    "        base_config = super().get_config()\n",
    "        return {**base_config, \"threshold\": self.threshold}        "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "This class handles shapes better, and it also supports sample weights."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 119,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
    "                          input_shape=input_shape),\n",
    "    tf.keras.layers.Dense(1),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 120,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.compile(loss=tf.keras.losses.Huber(2.0), optimizer=\"nadam\",\n",
    "              weighted_metrics=[HuberMetric(2.0)])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 121,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 898us/step - loss: 0.3272 - HuberMetric: 0.6594\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 892us/step - loss: 0.1449 - HuberMetric: 0.2919\n"
     ]
    }
   ],
   "source": [
    "np.random.seed(42)\n",
    "sample_weight = np.random.rand(len(y_train))\n",
    "history = model.fit(X_train_scaled, y_train, epochs=2,\n",
    "                    sample_weight=sample_weight)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 122,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(0.3272010087966919, 0.3272010869771911)"
      ]
     },
     "execution_count": 122,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "(history.history[\"loss\"][0],\n",
    " history.history[\"HuberMetric\"][0] * sample_weight.mean())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 123,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_metric_v2/assets\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_metric_v2/assets\n"
     ]
    }
   ],
   "source": [
    "model.save(\"my_model_with_a_custom_metric_v2\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 124,
   "metadata": {},
   "outputs": [],
   "source": [
    "model = tf.keras.models.load_model(\"my_model_with_a_custom_metric_v2\",\n",
    "                                   custom_objects={\"HuberMetric\": HuberMetric})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 125,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 970us/step - loss: 0.2442 - HuberMetric: 0.2442\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 857us/step - loss: 0.2184 - HuberMetric: 0.2184\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19c576e90>"
      ]
     },
     "execution_count": 125,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled, y_train, epochs=2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 126,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "2.0"
      ]
     },
     "execution_count": 126,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.metrics[-1].threshold"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Custom Layers"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 127,
   "metadata": {},
   "outputs": [],
   "source": [
    "exponential_layer = tf.keras.layers.Lambda(lambda x: tf.exp(x))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 128,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(3,), dtype=float32, numpy=array([0.36787945, 1.        , 2.7182817 ], dtype=float32)>"
      ]
     },
     "execution_count": 128,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – like all layers, it can be used as a function:\n",
    "exponential_layer([-1., 0., 1.])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Adding an exponential layer at the output of a regression model can be useful if the values to predict are positive and with very different scales (e.g., 0.001, 10., 10000)."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 129,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/5\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.7784 - val_loss: 0.4393\n",
      "Epoch 2/5\n",
      "363/363 [==============================] - 0s 891us/step - loss: 0.5702 - val_loss: 0.4094\n",
      "Epoch 3/5\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.4431 - val_loss: 0.3760\n",
      "Epoch 4/5\n",
      "363/363 [==============================] - 0s 921us/step - loss: 0.4984 - val_loss: 0.3785\n",
      "Epoch 5/5\n",
      "363/363 [==============================] - 0s 943us/step - loss: 0.3966 - val_loss: 0.3633\n",
      "162/162 [==============================] - 0s 631us/step - loss: 0.3781\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "0.3781099021434784"
      ]
     },
     "execution_count": 129,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\", input_shape=input_shape),\n",
    "    tf.keras.layers.Dense(1),\n",
    "    exponential_layer\n",
    "])\n",
    "model.compile(loss=\"mse\", optimizer=\"sgd\")\n",
    "model.fit(X_train_scaled, y_train, epochs=5,\n",
    "          validation_data=(X_valid_scaled, y_valid))\n",
    "model.evaluate(X_test_scaled, y_test)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Alternatively, it's often preferable to replace the targets with the logarithm of the targets (and use no activation function in the output layer)."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 130,
   "metadata": {},
   "outputs": [],
   "source": [
    "class MyDense(tf.keras.layers.Layer):\n",
    "    def __init__(self, units, activation=None, **kwargs):\n",
    "        super().__init__(**kwargs)\n",
    "        self.units = units\n",
    "        self.activation = tf.keras.activations.get(activation)\n",
    "\n",
    "    def build(self, batch_input_shape):\n",
    "        self.kernel = self.add_weight(\n",
    "            name=\"kernel\", shape=[batch_input_shape[-1], self.units],\n",
    "            initializer=\"he_normal\")\n",
    "        self.bias = self.add_weight(\n",
    "            name=\"bias\", shape=[self.units], initializer=\"zeros\")\n",
    "\n",
    "    def call(self, X):\n",
    "        return self.activation(X @ self.kernel + self.bias)\n",
    "\n",
    "    def get_config(self):\n",
    "        base_config = super().get_config()\n",
    "        return {**base_config, \"units\": self.units,\n",
    "                \"activation\": tf.keras.activations.serialize(self.activation)}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 131,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 3.1183 - val_loss: 6.9549\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.8702 - val_loss: 3.2627\n",
      "162/162 [==============================] - 0s 718us/step - loss: 0.7039\n",
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_layer/assets\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_model_with_a_custom_layer/assets\n"
     ]
    }
   ],
   "source": [
    "# extra code – shows that a custom layer can be used normally\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    MyDense(30, activation=\"relu\", input_shape=input_shape),\n",
    "    MyDense(1)\n",
    "])\n",
    "model.compile(loss=\"mse\", optimizer=\"nadam\")\n",
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))\n",
    "model.evaluate(X_test_scaled, y_test)\n",
    "model.save(\"my_model_with_a_custom_layer\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 132,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 0.5945 - val_loss: 0.5318\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.4712 - val_loss: 0.5751\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19cbf39a0>"
      ]
     },
     "execution_count": 132,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows how to load a model with a custom layer\n",
    "model = tf.keras.models.load_model(\"my_model_with_a_custom_layer\",\n",
    "                                   custom_objects={\"MyDense\": MyDense})\n",
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 133,
   "metadata": {},
   "outputs": [],
   "source": [
    "class MyMultiLayer(tf.keras.layers.Layer):\n",
    "    def call(self, X):\n",
    "        X1, X2 = X\n",
    "        print(\"X1.shape: \", X1.shape ,\" X2.shape: \", X2.shape)  # extra code\n",
    "        return X1 + X2, X1 * X2, X1 / X2"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Our custom layer can be called using the functional API like this:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 134,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "X1.shape:  (None, 2)  X2.shape:  (None, 2)\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(<KerasTensor: shape=(None, 2) dtype=float32 (created by layer 'my_multi_layer')>,\n",
       " <KerasTensor: shape=(None, 2) dtype=float32 (created by layer 'my_multi_layer')>,\n",
       " <KerasTensor: shape=(None, 2) dtype=float32 (created by layer 'my_multi_layer')>)"
      ]
     },
     "execution_count": 134,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – tests MyMultiLayer with symbolic inputs\n",
    "inputs1 = tf.keras.layers.Input(shape=[2])\n",
    "inputs2 = tf.keras.layers.Input(shape=[2])\n",
    "MyMultiLayer()((inputs1, inputs2))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Note that the `call()` method receives symbolic inputs, and it returns symbolic outputs. The shapes are only partially specified at this stage: we don't know the batch size, which is why the first dimension is `None`.\n",
    "\n",
    "We can also pass actual data to the custom layer:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 135,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "X1.shape:  (2, 2)  X2.shape:  (2, 2)\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(<tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
       " array([[ 9., 18.],\n",
       "        [ 6., 10.]], dtype=float32)>,\n",
       " <tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
       " array([[18., 72.],\n",
       "        [ 8., 21.]], dtype=float32)>,\n",
       " <tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
       " array([[0.5      , 0.5      ],\n",
       "        [0.5      , 2.3333333]], dtype=float32)>)"
      ]
     },
     "execution_count": 135,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – tests MyMultiLayer with actual data \n",
    "X1, X2 = np.array([[3., 6.], [2., 7.]]), np.array([[6., 12.], [4., 3.]]) \n",
    "MyMultiLayer()((X1, X2))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Now let's create a layer with a different behavior during training and testing:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 136,
   "metadata": {},
   "outputs": [],
   "source": [
    "class MyGaussianNoise(tf.keras.layers.Layer):\n",
    "    def __init__(self, stddev, **kwargs):\n",
    "        super().__init__(**kwargs)\n",
    "        self.stddev = stddev\n",
    "\n",
    "    def call(self, X, training=None):\n",
    "        if training:\n",
    "            noise = tf.random.normal(tf.shape(X), stddev=self.stddev)\n",
    "            return X + noise\n",
    "        else:\n",
    "            return X"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Here's a simple model that uses this custom layer:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 137,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 2.2220 - val_loss: 25.1506\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 1.4104 - val_loss: 17.0415\n",
      "162/162 [==============================] - 0s 655us/step - loss: 1.1059\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "1.1058681011199951"
      ]
     },
     "execution_count": 137,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – tests MyGaussianNoise\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([\n",
    "    MyGaussianNoise(stddev=1.0, input_shape=input_shape),\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\",\n",
    "                          kernel_initializer=\"he_normal\"),\n",
    "    tf.keras.layers.Dense(1)\n",
    "])\n",
    "model.compile(loss=\"mse\", optimizer=\"nadam\")\n",
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))\n",
    "model.evaluate(X_test_scaled, y_test)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Custom Models"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 138,
   "metadata": {},
   "outputs": [],
   "source": [
    "class ResidualBlock(tf.keras.layers.Layer):\n",
    "    def __init__(self, n_layers, n_neurons, **kwargs):\n",
    "        super().__init__(**kwargs)\n",
    "        self.hidden = [tf.keras.layers.Dense(n_neurons, activation=\"relu\",\n",
    "                                             kernel_initializer=\"he_normal\")\n",
    "                       for _ in range(n_layers)]\n",
    "\n",
    "    def call(self, inputs):\n",
    "        Z = inputs\n",
    "        for layer in self.hidden:\n",
    "            Z = layer(Z)\n",
    "        return inputs + Z"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 139,
   "metadata": {},
   "outputs": [],
   "source": [
    "class ResidualRegressor(tf.keras.Model):\n",
    "    def __init__(self, output_dim, **kwargs):\n",
    "        super().__init__(**kwargs)\n",
    "        self.hidden1 = tf.keras.layers.Dense(30, activation=\"relu\",\n",
    "                                             kernel_initializer=\"he_normal\")\n",
    "        self.block1 = ResidualBlock(2, 30)\n",
    "        self.block2 = ResidualBlock(2, 30)\n",
    "        self.out = tf.keras.layers.Dense(output_dim)\n",
    "\n",
    "    def call(self, inputs):\n",
    "        Z = self.hidden1(inputs)\n",
    "        for _ in range(1 + 3):\n",
    "            Z = self.block1(Z)\n",
    "        Z = self.block2(Z)\n",
    "        return self.out(Z)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 140,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 2s 1ms/step - loss: 32.7847\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 1.3612\n",
      "162/162 [==============================] - 0s 713us/step - loss: 1.1603\n",
      "INFO:tensorflow:Assets written to: my_custom_model/assets\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "INFO:tensorflow:Assets written to: my_custom_model/assets\n"
     ]
    }
   ],
   "source": [
    "# extra code – shows that the model can be used normally\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = ResidualRegressor(1)\n",
    "model.compile(loss=\"mse\", optimizer=\"nadam\")\n",
    "history = model.fit(X_train_scaled, y_train, epochs=2)\n",
    "score = model.evaluate(X_test_scaled, y_test)\n",
    "model.save(\"my_custom_model\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 141,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "363/363 [==============================] - 2s 1ms/step - loss: 1.3451\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.7928\n",
      "1/1 [==============================] - 0s 76ms/step\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "array([[1.1431919],\n",
       "       [1.0584592],\n",
       "       [4.71127  ]], dtype=float32)"
      ]
     },
     "execution_count": 141,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – the model can be loaded and you can continue training or use it\n",
    "#              to make predictions\n",
    "model = tf.keras.models.load_model(\"my_custom_model\")\n",
    "history = model.fit(X_train_scaled, y_train, epochs=2)\n",
    "model.predict(X_test_scaled[:3])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We could have defined the model using the sequential API instead:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 142,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)\n",
    "block1 = ResidualBlock(2, 30)\n",
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\",\n",
    "                          kernel_initializer=\"he_normal\"),\n",
    "    block1, block1, block1, block1,\n",
    "    ResidualBlock(2, 30),\n",
    "    tf.keras.layers.Dense(1)\n",
    "])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Losses and Metrics Based on Model Internals"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 143,
   "metadata": {},
   "outputs": [],
   "source": [
    "class ReconstructingRegressor(tf.keras.Model):\n",
    "    def __init__(self, output_dim, **kwargs):\n",
    "        super().__init__(**kwargs)\n",
    "        self.hidden = [tf.keras.layers.Dense(30, activation=\"relu\",\n",
    "                                             kernel_initializer=\"he_normal\")\n",
    "                       for _ in range(5)]\n",
    "        self.out = tf.keras.layers.Dense(output_dim)\n",
    "        self.reconstruction_mean = tf.keras.metrics.Mean(\n",
    "            name=\"reconstruction_error\")\n",
    "\n",
    "    def build(self, batch_input_shape):\n",
    "        n_inputs = batch_input_shape[-1]\n",
    "        self.reconstruct = tf.keras.layers.Dense(n_inputs)\n",
    "\n",
    "    def call(self, inputs, training=None):\n",
    "        Z = inputs\n",
    "        for layer in self.hidden:\n",
    "            Z = layer(Z)\n",
    "        reconstruction = self.reconstruct(Z)\n",
    "        recon_loss = tf.reduce_mean(tf.square(reconstruction - inputs))\n",
    "        self.add_loss(0.05 * recon_loss)\n",
    "        if training:\n",
    "            result = self.reconstruction_mean(recon_loss)\n",
    "            self.add_metric(result)\n",
    "        return self.out(Z)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 144,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/5\n",
      "363/363 [==============================] - 2s 1ms/step - loss: 0.8198 - reconstruction_error: 1.0892\n",
      "Epoch 2/5\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.4778 - reconstruction_error: 0.5583\n",
      "Epoch 3/5\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.4419 - reconstruction_error: 0.4227\n",
      "Epoch 4/5\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.3852 - reconstruction_error: 0.3587\n",
      "Epoch 5/5\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.3714 - reconstruction_error: 0.3245\n",
      "162/162 [==============================] - 0s 658us/step\n"
     ]
    }
   ],
   "source": [
    "# extra code\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = ReconstructingRegressor(1)\n",
    "model.compile(loss=\"mse\", optimizer=\"nadam\")\n",
    "history = model.fit(X_train_scaled, y_train, epochs=5)\n",
    "y_pred = model.predict(X_test_scaled)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Computing Gradients Using Autodiff"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 145,
   "metadata": {},
   "outputs": [],
   "source": [
    "def f(w1, w2):\n",
    "    return 3 * w1 ** 2 + 2 * w1 * w2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 146,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "36.000003007075065"
      ]
     },
     "execution_count": 146,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "w1, w2 = 5, 3\n",
    "eps = 1e-6\n",
    "(f(w1 + eps, w2) - f(w1, w2)) / eps"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 147,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "10.000000003174137"
      ]
     },
     "execution_count": 147,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "(f(w1, w2 + eps) - f(w1, w2)) / eps"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 148,
   "metadata": {},
   "outputs": [],
   "source": [
    "w1, w2 = tf.Variable(5.), tf.Variable(3.)\n",
    "with tf.GradientTape() as tape:\n",
    "    z = f(w1, w2)\n",
    "\n",
    "gradients = tape.gradient(z, [w1, w2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 149,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(), dtype=float32, numpy=36.0>,\n",
       " <tf.Tensor: shape=(), dtype=float32, numpy=10.0>]"
      ]
     },
     "execution_count": 149,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "gradients"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 150,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "A non-persistent GradientTape can only be used to compute one set of gradients (or jacobians)\n"
     ]
    }
   ],
   "source": [
    "with tf.GradientTape() as tape:\n",
    "    z = f(w1, w2)\n",
    "\n",
    "dz_dw1 = tape.gradient(z, w1)  # returns tensor 36.0\n",
    "try:\n",
    "    dz_dw2 = tape.gradient(z, w2)  # raises a RuntimeError!\n",
    "except RuntimeError as ex:\n",
    "    print(ex)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 151,
   "metadata": {},
   "outputs": [],
   "source": [
    "with tf.GradientTape(persistent=True) as tape:\n",
    "    z = f(w1, w2)\n",
    "\n",
    "dz_dw1 = tape.gradient(z, w1)  # returns tensor 36.0\n",
    "dz_dw2 = tape.gradient(z, w2)  # returns tensor 10.0, works fine now!\n",
    "del tape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 152,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(<tf.Tensor: shape=(), dtype=float32, numpy=36.0>,\n",
       " <tf.Tensor: shape=(), dtype=float32, numpy=10.0>)"
      ]
     },
     "execution_count": 152,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "dz_dw1, dz_dw2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 153,
   "metadata": {},
   "outputs": [],
   "source": [
    "c1, c2 = tf.constant(5.), tf.constant(3.)\n",
    "with tf.GradientTape() as tape:\n",
    "    z = f(c1, c2)\n",
    "\n",
    "gradients = tape.gradient(z, [c1, c2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 154,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[None, None]"
      ]
     },
     "execution_count": 154,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "gradients"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 155,
   "metadata": {},
   "outputs": [],
   "source": [
    "with tf.GradientTape() as tape:\n",
    "    tape.watch(c1)\n",
    "    tape.watch(c2)\n",
    "    z = f(c1, c2)\n",
    "\n",
    "gradients = tape.gradient(z, [c1, c2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 156,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(), dtype=float32, numpy=36.0>,\n",
       " <tf.Tensor: shape=(), dtype=float32, numpy=10.0>]"
      ]
     },
     "execution_count": 156,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "gradients"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 157,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(), dtype=float32, numpy=136.0>,\n",
       " <tf.Tensor: shape=(), dtype=float32, numpy=30.0>]"
      ]
     },
     "execution_count": 157,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – if given a vector, tape.gradient() will compute the gradient of\n",
    "#              the vector's sum.\n",
    "with tf.GradientTape() as tape:\n",
    "    z1 = f(w1, w2 + 2.)\n",
    "    z2 = f(w1, w2 + 5.)\n",
    "    z3 = f(w1, w2 + 7.)\n",
    "\n",
    "tape.gradient([z1, z2, z3], [w1, w2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 158,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(), dtype=float32, numpy=136.0>,\n",
       " <tf.Tensor: shape=(), dtype=float32, numpy=30.0>]"
      ]
     },
     "execution_count": 158,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows that we get the same result as the previous cell\n",
    "with tf.GradientTape() as tape:\n",
    "    z1 = f(w1, w2 + 2.)\n",
    "    z2 = f(w1, w2 + 5.)\n",
    "    z3 = f(w1, w2 + 7.)\n",
    "    z = z1 + z2 + z3\n",
    "\n",
    "tape.gradient(z, [w1, w2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 159,
   "metadata": {},
   "outputs": [],
   "source": [
    "# extra code – shows how to compute the jacobians and the hessians\n",
    "with tf.GradientTape(persistent=True) as hessian_tape:\n",
    "    with tf.GradientTape() as jacobian_tape:\n",
    "        z = f(w1, w2)\n",
    "    jacobians = jacobian_tape.gradient(z, [w1, w2])\n",
    "hessians = [hessian_tape.gradient(jacobian, [w1, w2])\n",
    "            for jacobian in jacobians]\n",
    "del hessian_tape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 160,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(), dtype=float32, numpy=36.0>,\n",
       " <tf.Tensor: shape=(), dtype=float32, numpy=10.0>]"
      ]
     },
     "execution_count": 160,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "jacobians"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 161,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[[<tf.Tensor: shape=(), dtype=float32, numpy=6.0>,\n",
       "  <tf.Tensor: shape=(), dtype=float32, numpy=2.0>],\n",
       " [<tf.Tensor: shape=(), dtype=float32, numpy=2.0>, None]]"
      ]
     },
     "execution_count": 161,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "hessians"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 162,
   "metadata": {},
   "outputs": [],
   "source": [
    "def f(w1, w2):\n",
    "    return 3 * w1 ** 2 + tf.stop_gradient(2 * w1 * w2)\n",
    "\n",
    "with tf.GradientTape() as tape:\n",
    "    z = f(w1, w2)  # same result as without stop_gradient()\n",
    "\n",
    "gradients = tape.gradient(z, [w1, w2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 163,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(), dtype=float32, numpy=30.0>, None]"
      ]
     },
     "execution_count": 163,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "gradients"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 164,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(), dtype=float32, numpy=inf>]"
      ]
     },
     "execution_count": 164,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "x = tf.Variable(1e-50)\n",
    "with tf.GradientTape() as tape:\n",
    "    z = tf.sqrt(x)\n",
    "\n",
    "tape.gradient(z, [x])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 165,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=30.0>"
      ]
     },
     "execution_count": 165,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.math.log(tf.exp(tf.constant(30., dtype=tf.float32)) + 1.)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 166,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor: shape=(1,), dtype=float32, numpy=array([nan], dtype=float32)>]"
      ]
     },
     "execution_count": 166,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "x = tf.Variable([1.0e30])\n",
    "with tf.GradientTape() as tape:\n",
    "    z = my_softplus(x)\n",
    "\n",
    "tape.gradient(z, [x])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 167,
   "metadata": {},
   "outputs": [],
   "source": [
    "def my_softplus(z):\n",
    "    return tf.math.log(1 + tf.exp(-tf.abs(z))) + tf.maximum(0., z)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Here is the proof that this equation is equal to log(1 + exp(_z_)):\n",
    "* softplus(_z_) = log(1 + exp(_z_))\n",
    "* softplus(_z_) = log(1 + exp(_z_)) - log(exp(_z_)) + log(exp(_z_)) ; **just adding and subtracting the same value**\n",
    "* softplus(_z_) = log\\[(1 + exp(_z_)) / exp(_z_)\\] + log(exp(_z_)) ; **since log(_a_) - log(_b_) = log(_a_ / _b_)**\n",
    "* softplus(_z_) = log\\[(1 + exp(_z_)) / exp(_z_)\\] + _z_ ; **since log(exp(_z_)) = _z_**\n",
    "* softplus(_z_) = log\\[1 / exp(_z_) + exp(_z_) / exp(_z_)\\] + _z_ ; **since (1 + _a_) / _b_ = 1 / _b_ + _a_ / _b_**\n",
    "* softplus(_z_) = log\\[exp(–_z_) + 1\\] + _z_ ; **since 1 / exp(_z_) = exp(–z), and exp(_z_) / exp(_z_) = 1**\n",
    "* softplus(_z_) = softplus(–_z_) + _z_ ; **we recognize the definition at the top, but with –_z_**\n",
    "* softplus(_z_) = softplus(–|_z_|) + max(0, _z_) ; **if you consider both cases, _z_ < 0 or _z_ ≥ 0, you will see that this works**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 168,
   "metadata": {},
   "outputs": [],
   "source": [
    "@tf.custom_gradient\n",
    "def my_softplus(z):\n",
    "    def my_softplus_gradients(grads):  # grads = backprop'ed from upper layers\n",
    "        return grads * (1 - 1 / (1 + tf.exp(z)))  # stable grads of softplus\n",
    "\n",
    "    result = tf.math.log(1 + tf.exp(-tf.abs(z))) + tf.maximum(0., z)\n",
    "    return result, my_softplus_gradients"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 169,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(<tf.Tensor: shape=(1,), dtype=float32, numpy=array([1000.], dtype=float32)>,\n",
       " [<tf.Tensor: shape=(1,), dtype=float32, numpy=array([1.], dtype=float32)>])"
      ]
     },
     "execution_count": 169,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# extra code – shows that the function is now stable, as well as its gradients\n",
    "x = tf.Variable([1000.])\n",
    "with tf.GradientTape() as tape:\n",
    "    z = my_softplus(x)\n",
    "\n",
    "z, tape.gradient(z, [x])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Custom Training Loops"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 170,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)  # extra code – to ensure reproducibility\n",
    "l2_reg = tf.keras.regularizers.l2(0.05)\n",
    "model = tf.keras.models.Sequential([\n",
    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
    "                          kernel_regularizer=l2_reg),\n",
    "    tf.keras.layers.Dense(1, kernel_regularizer=l2_reg)\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 171,
   "metadata": {},
   "outputs": [],
   "source": [
    "def random_batch(X, y, batch_size=32):\n",
    "    idx = np.random.randint(len(X), size=batch_size)\n",
    "    return X[idx], y[idx]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 172,
   "metadata": {},
   "outputs": [],
   "source": [
    "def print_status_bar(step, total, loss, metrics=None):\n",
    "    metrics = \" - \".join([f\"{m.name}: {m.result():.4f}\"\n",
    "                          for m in [loss] + (metrics or [])])\n",
    "    end = \"\" if step < total else \"\\n\"\n",
    "    print(f\"\\r{step}/{total} - \" + metrics, end=end)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 173,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 174,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_epochs = 5\n",
    "batch_size = 32\n",
    "n_steps = len(X_train) // batch_size\n",
    "optimizer = tf.keras.optimizers.SGD(learning_rate=0.01)\n",
    "loss_fn = tf.keras.losses.mean_squared_error\n",
    "mean_loss = tf.keras.metrics.Mean()\n",
    "metrics = [tf.keras.metrics.MeanAbsoluteError()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 175,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/5\n",
      "362/362 - mean: 3.5419 - mean_absolute_error: 0.6640\n",
      "Epoch 2/5\n",
      "362/362 - mean: 1.8693 - mean_absolute_error: 0.5431\n",
      "Epoch 3/5\n",
      "362/362 - mean: 1.1428 - mean_absolute_error: 0.5030\n",
      "Epoch 4/5\n",
      "362/362 - mean: 0.8501 - mean_absolute_error: 0.4977\n",
      "Epoch 5/5\n",
      "362/362 - mean: 0.7280 - mean_absolute_error: 0.5014\n"
     ]
    }
   ],
   "source": [
    "for epoch in range(1, n_epochs + 1):\n",
    "    print(f\"Epoch {epoch}/{n_epochs}\")\n",
    "    for step in range(1, n_steps + 1):\n",
    "        X_batch, y_batch = random_batch(X_train_scaled, y_train)\n",
    "        with tf.GradientTape() as tape:\n",
    "            y_pred = model(X_batch, training=True)\n",
    "            main_loss = tf.reduce_mean(loss_fn(y_batch, y_pred))\n",
    "            loss = tf.add_n([main_loss] + model.losses)\n",
    "\n",
    "        gradients = tape.gradient(loss, model.trainable_variables)\n",
    "        optimizer.apply_gradients(zip(gradients, model.trainable_variables))\n",
    "\n",
    "        # extra code – if your model has variable constraints\n",
    "        for variable in model.variables:\n",
    "            if variable.constraint is not None:\n",
    "                variable.assign(variable.constraint(variable))\n",
    "\n",
    "        mean_loss(loss)\n",
    "        for metric in metrics:\n",
    "            metric(y_batch, y_pred)\n",
    "\n",
    "        print_status_bar(step, n_steps, mean_loss, metrics)\n",
    "\n",
    "    for metric in [mean_loss] + metrics:\n",
    "        metric.reset_states()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 176,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "28534c4a7baf4b78a8a9f1db10024cfd",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "All epochs:   0%|          | 0/5 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "cd7c0a89c62f476db08f755e6e4f1178",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 1/5:   0%|          | 0/362 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "5866293693b1455584e6a2e28811692a",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 2/5:   0%|          | 0/362 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "84cf94014b644e07b649063016221d3f",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 3/5:   0%|          | 0/362 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "21e3803f4d4249049efc0b725c9bd23f",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 4/5:   0%|          | 0/362 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "c8c0aa7115374ed8891175bafc6f7d0d",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 5/5:   0%|          | 0/362 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# extra code – shows how to use the tqdm package to display nice progress bars\n",
    "\n",
    "from tqdm.notebook import trange\n",
    "from collections import OrderedDict\n",
    "with trange(1, n_epochs + 1, desc=\"All epochs\") as epochs:\n",
    "    for epoch in epochs:\n",
    "        with trange(1, n_steps + 1, desc=f\"Epoch {epoch}/{n_epochs}\") as steps:\n",
    "            for step in steps:\n",
    "                X_batch, y_batch = random_batch(X_train_scaled, y_train)\n",
    "                with tf.GradientTape() as tape:\n",
    "                    y_pred = model(X_batch)\n",
    "                    main_loss = tf.reduce_mean(loss_fn(y_batch, y_pred))\n",
    "                    loss = tf.add_n([main_loss] + model.losses)\n",
    "\n",
    "                gradients = tape.gradient(loss, model.trainable_variables)\n",
    "                optimizer.apply_gradients(zip(gradients, model.trainable_variables))\n",
    "\n",
    "                for variable in model.variables:\n",
    "                    if variable.constraint is not None:\n",
    "                        variable.assign(variable.constraint(variable))\n",
    "\n",
    "                status = OrderedDict()\n",
    "                mean_loss(loss)\n",
    "                status[\"loss\"] = mean_loss.result().numpy()\n",
    "                for metric in metrics:\n",
    "                    metric(y_batch, y_pred)\n",
    "                    status[metric.name] = metric.result().numpy()\n",
    "\n",
    "                steps.set_postfix(status)\n",
    "\n",
    "        for metric in [mean_loss] + metrics:\n",
    "            metric.reset_states()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## TensorFlow Functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 177,
   "metadata": {},
   "outputs": [],
   "source": [
    "def cube(x):\n",
    "    return x ** 3"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 178,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "8"
      ]
     },
     "execution_count": 178,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cube(2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 179,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=8.0>"
      ]
     },
     "execution_count": 179,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cube(tf.constant(2.0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 180,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tensorflow.python.eager.polymorphic_function.polymorphic_function.Function at 0x19db349d0>"
      ]
     },
     "execution_count": 180,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf_cube = tf.function(cube)\n",
    "tf_cube"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 181,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=8>"
      ]
     },
     "execution_count": 181,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf_cube(2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 182,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=8.0>"
      ]
     },
     "execution_count": 182,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf_cube(tf.constant(2.0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 183,
   "metadata": {},
   "outputs": [],
   "source": [
    "@tf.function\n",
    "def tf_cube(x):\n",
    "    return x ** 3"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Note:** the rest of the code in this section is in appendix D."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### TF Functions and Concrete Functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 184,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<ConcreteFunction tf_cube(x) at 0x19F90F400>"
      ]
     },
     "execution_count": 184,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "concrete_function = tf_cube.get_concrete_function(tf.constant(2.0))\n",
    "concrete_function"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 185,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=8.0>"
      ]
     },
     "execution_count": 185,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "concrete_function(tf.constant(2.0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 186,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "True"
      ]
     },
     "execution_count": 186,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "concrete_function is tf_cube.get_concrete_function(tf.constant(2.0))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Exploring Function Definitions and Graphs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 187,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "PyGraph<6956689888>"
      ]
     },
     "execution_count": 187,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "concrete_function.graph"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 188,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Operation 'x' type=Placeholder>,\n",
       " <tf.Operation 'pow/y' type=Const>,\n",
       " <tf.Operation 'pow' type=Pow>,\n",
       " <tf.Operation 'Identity' type=Identity>]"
      ]
     },
     "execution_count": 188,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "ops = concrete_function.graph.get_operations()\n",
    "ops"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 189,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor 'x:0' shape=() dtype=float32>,\n",
       " <tf.Tensor 'pow/y:0' shape=() dtype=float32>]"
      ]
     },
     "execution_count": 189,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "pow_op = ops[2]\n",
    "list(pow_op.inputs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 190,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Tensor 'pow:0' shape=() dtype=float32>]"
      ]
     },
     "execution_count": 190,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "pow_op.outputs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 191,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Operation 'x' type=Placeholder>"
      ]
     },
     "execution_count": 191,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "concrete_function.graph.get_operation_by_name('x')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 192,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor 'Identity:0' shape=() dtype=float32>"
      ]
     },
     "execution_count": 192,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "concrete_function.graph.get_tensor_by_name('Identity:0')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 193,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "name: \"__inference_tf_cube_592407\"\n",
       "input_arg {\n",
       "  name: \"x\"\n",
       "  type: DT_FLOAT\n",
       "}\n",
       "output_arg {\n",
       "  name: \"identity\"\n",
       "  type: DT_FLOAT\n",
       "}"
      ]
     },
     "execution_count": 193,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "concrete_function.function_def.signature"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### How TF Functions Trace Python Functions to Extract Their Computation Graphs"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 194,
   "metadata": {},
   "outputs": [],
   "source": [
    "@tf.function\n",
    "def tf_cube(x):\n",
    "    print(f\"x = {x}\")\n",
    "    return x ** 3"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 195,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "x = Tensor(\"x:0\", shape=(), dtype=float32)\n"
     ]
    }
   ],
   "source": [
    "result = tf_cube(tf.constant(2.0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 196,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=8.0>"
      ]
     },
     "execution_count": 196,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "result"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 197,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "x = 2\n"
     ]
    }
   ],
   "source": [
    "result = tf_cube(2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 198,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "x = 3\n"
     ]
    }
   ],
   "source": [
    "result = tf_cube(3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 199,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "x = Tensor(\"x:0\", shape=(1, 2), dtype=float32)\n"
     ]
    }
   ],
   "source": [
    "result = tf_cube(tf.constant([[1., 2.]]))  # New shape: trace!"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 200,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "x = Tensor(\"x:0\", shape=(2, 2), dtype=float32)\n",
      "WARNING:tensorflow:5 out of the last 5 calls to <function tf_cube at 0x19f910c10> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "WARNING:tensorflow:5 out of the last 5 calls to <function tf_cube at 0x19f910c10> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.\n"
     ]
    }
   ],
   "source": [
    "result = tf_cube(tf.constant([[3., 4.], [5., 6.]]))  # New shape: trace!"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 201,
   "metadata": {},
   "outputs": [],
   "source": [
    "result = tf_cube(tf.constant([[7., 8.], [9., 10.]]))  # Same shape: no trace"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "It is also possible to specify a particular input signature:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 202,
   "metadata": {},
   "outputs": [],
   "source": [
    "@tf.function(input_signature=[tf.TensorSpec([None, 28, 28], tf.float32)])\n",
    "def shrink(images):\n",
    "    print(\"Tracing\", images)  # extra code to show when tracing happens\n",
    "    return images[:, ::2, ::2] # drop half the rows and columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 203,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 204,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Tracing Tensor(\"images:0\", shape=(None, 28, 28), dtype=float32)\n"
     ]
    }
   ],
   "source": [
    "img_batch_1 = tf.random.uniform(shape=[100, 28, 28])\n",
    "img_batch_2 = tf.random.uniform(shape=[50, 28, 28])\n",
    "preprocessed_images = shrink(img_batch_1)  # Works fine, traces the function\n",
    "preprocessed_images = shrink(img_batch_2)  # Works fine, same concrete function"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 205,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Binding inputs to tf.function `shrink` failed due to `Can not cast TensorSpec(shape=(2, 2, 2), dtype=tf.float32, name=None) to TensorSpec(shape=(None, 28, 28), dtype=tf.float32, name=None)`. Received args: (<tf.Tensor: shape=(2, 2, 2), dtype=float32, numpy=\n",
      "array([[[0.7413678 , 0.62854624],\n",
      "        [0.01738465, 0.3431449 ]],\n",
      "\n",
      "       [[0.51063764, 0.3777541 ],\n",
      "        [0.07321596, 0.02137029]]], dtype=float32)>,) and kwargs: {} for signature: (images: TensorSpec(shape=(None, 28, 28), dtype=tf.float32, name=None)).\n"
     ]
    }
   ],
   "source": [
    "img_batch_3 = tf.random.uniform(shape=[2, 2, 2])\n",
    "try:\n",
    "    preprocessed_images = shrink(img_batch_3)  # TypeError! Incompatible inputs\n",
    "except TypeError as ex:\n",
    "    print(ex)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Using Autograph To Capture Control Flow"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "A \"static\" `for` loop using `range()`:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 206,
   "metadata": {},
   "outputs": [],
   "source": [
    "@tf.function\n",
    "def add_10(x):\n",
    "    \"\"\"Add 10 to `x` with a Python `range()` loop (one addition per iteration).\"\"\"\n",
    "    for _ in range(10):\n",
    "        x = x + 1\n",
    "    return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 207,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=15>"
      ]
     },
     "execution_count": 207,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "add_10(tf.constant(5))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 208,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Operation 'x' type=Placeholder>,\n",
       " <tf.Operation 'add/y' type=Const>,\n",
       " <tf.Operation 'add' type=AddV2>,\n",
       " <tf.Operation 'add_1/y' type=Const>,\n",
       " <tf.Operation 'add_1' type=AddV2>,\n",
       " <tf.Operation 'add_2/y' type=Const>,\n",
       " <tf.Operation 'add_2' type=AddV2>,\n",
       " <tf.Operation 'add_3/y' type=Const>,\n",
       " <tf.Operation 'add_3' type=AddV2>,\n",
       " <tf.Operation 'add_4/y' type=Const>,\n",
       " <tf.Operation 'add_4' type=AddV2>,\n",
       " <tf.Operation 'add_5/y' type=Const>,\n",
       " <tf.Operation 'add_5' type=AddV2>,\n",
       " <tf.Operation 'add_6/y' type=Const>,\n",
       " <tf.Operation 'add_6' type=AddV2>,\n",
       " <tf.Operation 'add_7/y' type=Const>,\n",
       " <tf.Operation 'add_7' type=AddV2>,\n",
       " <tf.Operation 'add_8/y' type=Const>,\n",
       " <tf.Operation 'add_8' type=AddV2>,\n",
       " <tf.Operation 'add_9/y' type=Const>,\n",
       " <tf.Operation 'add_9' type=AddV2>,\n",
       " <tf.Operation 'Identity' type=Identity>]"
      ]
     },
     "execution_count": 208,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "add_10.get_concrete_function(tf.constant(5)).graph.get_operations()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "A \"dynamic\" loop using `tf.while_loop()`:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 209,
   "metadata": {},
   "outputs": [],
   "source": [
    "# extra code – shows how to use tf.while_loop (usually @tf.function is simpler)\n",
    "@tf.function\n",
    "def add_10(x):\n",
    "    \"\"\"Add 10 to `x` by running an explicit `tf.while_loop()` for 10 iterations.\"\"\"\n",
    "    def keep_going(step, total):\n",
    "        return tf.less(step, 10)\n",
    "\n",
    "    def advance(step, total):\n",
    "        return tf.add(step, 1), tf.add(total, 1)\n",
    "\n",
    "    _, result = tf.while_loop(keep_going, advance, [tf.constant(0), x])\n",
    "    return result"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 210,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=15>"
      ]
     },
     "execution_count": 210,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "add_10(tf.constant(5))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 211,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Operation 'x' type=Placeholder>,\n",
       " <tf.Operation 'Const' type=Const>,\n",
       " <tf.Operation 'while/maximum_iterations' type=Const>,\n",
       " <tf.Operation 'while/loop_counter' type=Const>,\n",
       " <tf.Operation 'while' type=StatelessWhile>,\n",
       " <tf.Operation 'Identity' type=Identity>]"
      ]
     },
     "execution_count": 211,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "add_10.get_concrete_function(tf.constant(5)).graph.get_operations()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "A \"dynamic\" `for` loop using `tf.range()` (captured by autograph):"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 212,
   "metadata": {},
   "outputs": [],
   "source": [
    "@tf.function\n",
    "def add_10(x):\n",
    "    \"\"\"Add 10 to `x` by looping over `tf.range(10)` (captured by autograph).\"\"\"\n",
    "    for step in tf.range(10):\n",
    "        x += 1\n",
    "    return x"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 213,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[<tf.Operation 'x' type=Placeholder>,\n",
       " <tf.Operation 'range/start' type=Const>,\n",
       " <tf.Operation 'range/limit' type=Const>,\n",
       " <tf.Operation 'range/delta' type=Const>,\n",
       " <tf.Operation 'range' type=Range>,\n",
       " <tf.Operation 'sub' type=Sub>,\n",
       " <tf.Operation 'floordiv' type=FloorDiv>,\n",
       " <tf.Operation 'mod' type=FloorMod>,\n",
       " <tf.Operation 'zeros_like' type=Const>,\n",
       " <tf.Operation 'NotEqual' type=NotEqual>,\n",
       " <tf.Operation 'Cast' type=Cast>,\n",
       " <tf.Operation 'add' type=AddV2>,\n",
       " <tf.Operation 'zeros_like_1' type=Const>,\n",
       " <tf.Operation 'Maximum' type=Maximum>,\n",
       " <tf.Operation 'while/maximum_iterations' type=Const>,\n",
       " <tf.Operation 'while/loop_counter' type=Const>,\n",
       " <tf.Operation 'while' type=StatelessWhile>,\n",
       " <tf.Operation 'Identity' type=Identity>]"
      ]
     },
     "execution_count": 213,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "add_10.get_concrete_function(tf.constant(0)).graph.get_operations()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Handling Variables and Other Resources in TF Functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 214,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=2>"
      ]
     },
     "execution_count": 214,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "counter = tf.Variable(initial_value=0)\n",
    "\n",
    "\n",
    "@tf.function\n",
    "def increment(counter, c=1):\n",
    "    \"\"\"Add `c` to the variable passed as `counter` and return the result of `assign_add()`.\"\"\"\n",
    "    return counter.assign_add(delta=c)\n",
    "\n",
    "\n",
    "increment(counter)  # counter is now equal to 1\n",
    "increment(counter)  # counter is now equal to 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 215,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "name: \"counter\"\n",
       "type: DT_RESOURCE"
      ]
     },
     "execution_count": 215,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "function_def = increment.get_concrete_function(counter).function_def\n",
    "function_def.signature.input_arg[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 216,
   "metadata": {},
   "outputs": [],
   "source": [
    "counter = tf.Variable(initial_value=0)\n",
    "\n",
    "\n",
    "@tf.function\n",
    "def increment(c=1):\n",
    "    \"\"\"Add `c` to the global variable `counter` and return the result of `assign_add()`.\"\"\"\n",
    "    return counter.assign_add(delta=c)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 217,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=2>"
      ]
     },
     "execution_count": 217,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "increment()\n",
    "increment()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 218,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "name: \"assignaddvariableop_resource\"\n",
       "type: DT_RESOURCE"
      ]
     },
     "execution_count": 218,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "function_def = increment.get_concrete_function().function_def\n",
    "function_def.signature.input_arg[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 219,
   "metadata": {},
   "outputs": [],
   "source": [
    "class Counter:\n",
    "    \"\"\"Holds a `tf.Variable` counter that is incremented through a TF function method.\"\"\"\n",
    "\n",
    "    def __init__(self):\n",
    "        self.counter = tf.Variable(initial_value=0)\n",
    "\n",
    "    @tf.function\n",
    "    def increment(self, c=1):\n",
    "        \"\"\"Add `c` to `self.counter` and return the result of `assign_add()`.\"\"\"\n",
    "        return self.counter.assign_add(delta=c)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 220,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=int32, numpy=2>"
      ]
     },
     "execution_count": 220,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "c = Counter()\n",
    "c.increment()\n",
    "c.increment()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 221,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "def tf__add(x):\n",
      "    with ag__.FunctionScope('add_10', 'fscope', ag__.ConversionOptions(recursive=True, user_requested=True, optional_features=(), internal_convert_user_code=True)) as fscope:\n",
      "        do_return = False\n",
      "        retval_ = ag__.UndefinedReturnValue()\n",
      "\n",
      "        def get_state():\n",
      "            return (x,)\n",
      "\n",
      "        def set_state(vars_):\n",
      "            nonlocal x\n",
      "            (x,) = vars_\n",
      "\n",
      "        def loop_body(itr):\n",
      "            nonlocal x\n",
      "            i = itr\n",
      "            x = ag__.ld(x)\n",
      "            x += 1\n",
      "        i = ag__.Undefined('i')\n",
      "        ag__.for_stmt(ag__.converted_call(ag__.ld(tf).range, (10,), None, fscope), None, loop_body, get_state, set_state, ('x',), {'iterate_names': 'i'})\n",
      "        try:\n",
      "            do_return = True\n",
      "            retval_ = ag__.ld(x)\n",
      "        except:\n",
      "            do_return = False\n",
      "            raise\n",
      "        return fscope.ret(retval_, do_return)\n",
      "\n"
     ]
    }
   ],
   "source": [
    "# Same `tf.range()` loop as before; it is redefined here so that the source\n",
    "# generated by autograph for it can be printed below.\n",
    "@tf.function\n",
    "def add_10(x):\n",
    "    for i in tf.range(10):\n",
    "        x += 1\n",
    "    return x\n",
    "\n",
    "# `python_function` is the plain Python function wrapped by the TF function;\n",
    "# `to_code()` returns the code autograph generates from it, as a string.\n",
    "print(tf.autograph.to_code(add_10.python_function))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 222,
   "metadata": {},
   "outputs": [],
   "source": [
    "# extra code – shows how to display the autograph code with syntax highlighting\n",
    "def display_tf_code(func):\n",
    "    \"\"\"Display the autograph-generated code of `func` as a Python Markdown block.\n",
    "\n",
    "    If `func` has a `python_function` attribute (as TF functions do), the code\n",
    "    generated for that underlying function is shown instead.\n",
    "    \"\"\"\n",
    "    from IPython.display import Markdown, display\n",
    "\n",
    "    target = getattr(func, \"python_function\", func)\n",
    "    generated = tf.autograph.to_code(target)\n",
    "    display(Markdown(f'```python\\n{generated}\\n```'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 223,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/markdown": [
       "```python\n",
       "def tf__add(x):\n",
       "    with ag__.FunctionScope('add_10', 'fscope', ag__.ConversionOptions(recursive=True, user_requested=True, optional_features=(), internal_convert_user_code=True)) as fscope:\n",
       "        do_return = False\n",
       "        retval_ = ag__.UndefinedReturnValue()\n",
       "\n",
       "        def get_state():\n",
       "            return (x,)\n",
       "\n",
       "        def set_state(vars_):\n",
       "            nonlocal x\n",
       "            (x,) = vars_\n",
       "\n",
       "        def loop_body(itr):\n",
       "            nonlocal x\n",
       "            i = itr\n",
       "            x = ag__.ld(x)\n",
       "            x += 1\n",
       "        i = ag__.Undefined('i')\n",
       "        ag__.for_stmt(ag__.converted_call(ag__.ld(tf).range, (10,), None, fscope), None, loop_body, get_state, set_state, ('x',), {'iterate_names': 'i'})\n",
       "        try:\n",
       "            do_return = True\n",
       "            retval_ = ag__.ld(x)\n",
       "        except:\n",
       "            do_return = False\n",
       "            raise\n",
       "        return fscope.ret(retval_, do_return)\n",
       "\n",
       "```"
      ],
      "text/plain": [
       "<IPython.core.display.Markdown object>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "display_tf_code(add_10)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Using TF Functions with tf.keras (or Not)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "By default, tf.keras will automatically convert your custom code into TF Functions, so there is no need to use\n",
    "`tf.function()`:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 224,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Custom loss function\n",
    "def my_mse(y_true, y_pred):\n",
    "    \"\"\"Return the mean of the squared differences between `y_pred` and `y_true`.\"\"\"\n",
    "    print(\"Tracing loss my_mse()\")\n",
    "    squared_errors = tf.square(y_pred - y_true)\n",
    "    return tf.reduce_mean(squared_errors)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 225,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Custom metric function\n",
    "def my_mae(y_true, y_pred):\n",
    "    \"\"\"Return the mean of the absolute differences between `y_pred` and `y_true`.\"\"\"\n",
    "    print(\"Tracing metric my_mae()\")\n",
    "    absolute_errors = tf.abs(y_pred - y_true)\n",
    "    return tf.reduce_mean(absolute_errors)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 226,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Custom layer\n",
    "class MyDense(tf.keras.layers.Layer):\n",
    "    \"\"\"Dense layer computing `activation(X @ kernel + biases)`.\"\"\"\n",
    "\n",
    "    def __init__(self, units, activation=None, **kwargs):\n",
    "        \"\"\"Store the layer's hyperparameters.\n",
    "\n",
    "        Args:\n",
    "          units: size of the last dimension of the kernel and of the biases.\n",
    "          activation: anything accepted by `tf.keras.activations.get()`.\n",
    "          **kwargs: forwarded to `tf.keras.layers.Layer`.\n",
    "        \"\"\"\n",
    "        super().__init__(**kwargs)\n",
    "        self.units = units\n",
    "        self.activation = tf.keras.activations.get(activation)\n",
    "\n",
    "    def build(self, input_shape):\n",
    "        \"\"\"Create the kernel and bias weights from the input shape.\"\"\"\n",
    "        # the feature axis is the last one (same as axis 1 for 2D inputs)\n",
    "        self.kernel = self.add_weight(name='kernel',\n",
    "                                      shape=(input_shape[-1], self.units),\n",
    "                                      initializer='uniform',\n",
    "                                      trainable=True)\n",
    "        self.biases = self.add_weight(name='bias',\n",
    "                                      shape=(self.units,),\n",
    "                                      initializer='zeros',\n",
    "                                      trainable=True)\n",
    "\n",
    "    def call(self, X):\n",
    "        \"\"\"Apply the affine transformation followed by the activation.\"\"\"\n",
    "        print(\"Tracing MyDense.call()\")\n",
    "        return self.activation(X @ self.kernel + self.biases)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 227,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 228,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Custom model\n",
    "class MyModel(tf.keras.Model):\n",
    "    \"\"\"Two stacked `MyDense` hidden layers whose output is concatenated with the\n",
    "    model input before a final 1-unit `MyDense` layer.\"\"\"\n",
    "\n",
    "    def __init__(self, **kwargs):\n",
    "        super().__init__(**kwargs)\n",
    "        self.hidden1 = MyDense(units=30, activation=\"relu\")\n",
    "        self.hidden2 = MyDense(units=30, activation=\"relu\")\n",
    "        self.output_ = MyDense(units=1)\n",
    "\n",
    "    def call(self, input):\n",
    "        \"\"\"Run the forward pass and return the output layer's result.\"\"\"\n",
    "        print(\"Tracing MyModel.call()\")\n",
    "        hidden_out = self.hidden2(self.hidden1(input))\n",
    "        merged = tf.keras.layers.concatenate([input, hidden_out])\n",
    "        return self.output_(merged)\n",
    "\n",
    "\n",
    "model = MyModel()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 229,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.compile(loss=my_mse, optimizer=\"nadam\", metrics=[my_mae])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 230,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/2\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "315/363 [=========================>....] - ETA: 0s - loss: 1.5746 - my_mae: 0.8719Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "363/363 [==============================] - 1s 1ms/step - loss: 1.4303 - my_mae: 0.8219 - val_loss: 0.4932 - val_my_mae: 0.4764\n",
      "Epoch 2/2\n",
      "363/363 [==============================] - 0s 1ms/step - loss: 0.4386 - my_mae: 0.4760 - val_loss: 1.0322 - val_my_mae: 0.4793\n",
      "162/162 [==============================] - 0s 704us/step - loss: 0.4204 - my_mae: 0.4711\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "[0.4203692376613617, 0.4711270332336426]"
      ]
     },
     "execution_count": 230,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled, y_train, epochs=2,\n",
    "          validation_data=(X_valid_scaled, y_valid))\n",
    "model.evaluate(X_test_scaled, y_test)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "You can turn this off by creating the model with `dynamic=True` (or calling `super().__init__(dynamic=True, **kwargs)` in the model's constructor):"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 231,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 232,
   "metadata": {},
   "outputs": [],
   "source": [
    "model = MyModel(dynamic=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 233,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.compile(loss=my_mse, optimizer=\"nadam\", metrics=[my_mae])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Now the custom code will be called at each iteration. Let's fit, validate and evaluate with tiny datasets to avoid getting too much output:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 234,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "[5.545090198516846, 2.0603599548339844]"
      ]
     },
     "execution_count": 234,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled[:64], y_train[:64], epochs=1,\n",
    "          validation_data=(X_valid_scaled[:64], y_valid[:64]), verbose=0)\n",
    "model.evaluate(X_test_scaled[:64], y_test[:64], verbose=0)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Alternatively, you can compile a model with `run_eagerly=True`:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 235,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 236,
   "metadata": {},
   "outputs": [],
   "source": [
    "model = MyModel()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 237,
   "metadata": {},
   "outputs": [],
   "source": [
    "model.compile(loss=my_mse, optimizer=\"nadam\", metrics=[my_mae], run_eagerly=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 238,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n",
      "Tracing MyModel.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing MyDense.call()\n",
      "Tracing loss my_mse()\n",
      "Tracing metric my_mae()\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "[5.545090198516846, 2.0603599548339844]"
      ]
     },
     "execution_count": 238,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "model.fit(X_train_scaled[:64], y_train[:64], epochs=1,\n",
    "          validation_data=(X_valid_scaled[:64], y_valid[:64]), verbose=0)\n",
    "model.evaluate(X_test_scaled[:64], y_test[:64], verbose=0)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Extra Material – Custom Optimizers"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Defining custom optimizers is not very common, but in case you are one of the happy few who get to write one, here is an example:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 239,
   "metadata": {},
   "outputs": [],
   "source": [
    "class MyMomentumOptimizer(tf.keras.optimizers.Optimizer):\n",
    "    \"\"\"Gradient descent with momentum optimizer.\n",
    "\n",
    "    One accumulator `m` is kept per model variable. At each step it is updated\n",
    "    as `m = -gradient * learning_rate + m * momentum`, then added to the variable.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, learning_rate=0.001, momentum=0.9, name=\"MyMomentumOptimizer\", **kwargs):\n",
    "        \"\"\"Create the optimizer.\n",
    "\n",
    "        Args:\n",
    "          learning_rate: learning rate, passed to `_build_learning_rate()`.\n",
    "          momentum: factor applied to the previous accumulator value at each step.\n",
    "          name: name of the optimizer.\n",
    "          **kwargs: forwarded to `tf.keras.optimizers.Optimizer`.\n",
    "        \"\"\"\n",
    "        super().__init__(name=name, **kwargs)\n",
    "        self._learning_rate = self._build_learning_rate(learning_rate)\n",
    "        self.momentum = momentum\n",
    "\n",
    "    def build(self, var_list):\n",
    "        \"\"\"Initialize optimizer variables.\n",
    "\n",
    "        Args:\n",
    "          var_list: list of model variables to build momentum variables on.\n",
    "        \"\"\"\n",
    "        super().build(var_list)\n",
    "        if getattr(self, \"_built\", False):\n",
    "            return\n",
    "        self.momentums = []\n",
    "        for var in var_list:\n",
    "            self.momentums.append(\n",
    "                self.add_variable_from_reference(\n",
    "                    model_variable=var, variable_name=\"m\"\n",
    "                )\n",
    "            )\n",
    "        self._built = True\n",
    "\n",
    "    def update_step(self, gradient, variable):\n",
    "        \"\"\"Update step given gradient and the associated model variable.\"\"\"\n",
    "        lr = tf.cast(self.learning_rate, variable.dtype)\n",
    "        var_key = self._var_key(variable)\n",
    "        momentum = tf.cast(self.momentum, variable.dtype)\n",
    "        # build() appends one accumulator per variable, so this is never None\n",
    "        m = self.momentums[self._index_dict[var_key]]\n",
    "        m.assign(-gradient * lr + m * momentum)\n",
    "        variable.assign_add(m)\n",
    "\n",
    "    def get_config(self):\n",
    "        \"\"\"Return the base config extended with `learning_rate` and `momentum`.\"\"\"\n",
    "        base_config = super().get_config()\n",
    "        return {\n",
    "            **base_config,\n",
    "            \"learning_rate\": self._serialize_hyperparameter(self._learning_rate),\n",
    "            \"momentum\": self.momentum,\n",
    "        }"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 240,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/5\n",
      "363/363 [==============================] - 0s 660us/step - loss: 1.1844\n",
      "Epoch 2/5\n",
      "363/363 [==============================] - 0s 625us/step - loss: 0.5635\n",
      "Epoch 3/5\n",
      "363/363 [==============================] - 0s 609us/step - loss: 0.9703\n",
      "Epoch 4/5\n",
      "363/363 [==============================] - 0s 627us/step - loss: 0.5678\n",
      "Epoch 5/5\n",
      "363/363 [==============================] - 0s 640us/step - loss: 0.6350\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19c821210>"
      ]
     },
     "execution_count": 240,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "optimizer = MyMomentumOptimizer()\n",
    "\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([tf.keras.layers.Dense(1, input_shape=[8])])\n",
    "model.compile(loss=\"mse\", optimizer=optimizer)\n",
    "model.fit(X_train_scaled, y_train, epochs=5)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Let's compare that to Keras's built-in momentum optimizer:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 241,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Epoch 1/5\n",
      "363/363 [==============================] - 0s 645us/step - loss: 1.1844\n",
      "Epoch 2/5\n",
      "363/363 [==============================] - 0s 721us/step - loss: 0.5635\n",
      "Epoch 3/5\n",
      "363/363 [==============================] - 0s 612us/step - loss: 0.9703\n",
      "Epoch 4/5\n",
      "363/363 [==============================] - 0s 625us/step - loss: 0.5678\n",
      "Epoch 5/5\n",
      "363/363 [==============================] - 0s 626us/step - loss: 0.6350\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<keras.src.callbacks.History at 0x19ea8da20>"
      ]
     },
     "execution_count": 241,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "optimizer = tf.keras.optimizers.SGD(learning_rate=0.001, momentum=0.9)\n",
    "\n",
    "tf.keras.utils.set_random_seed(42)\n",
    "model = tf.keras.Sequential([tf.keras.layers.Dense(1, input_shape=[8])])\n",
    "model.compile(loss=\"mse\", optimizer=optimizer)\n",
    "model.fit(X_train_scaled, y_train, epochs=5)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Yep, we get the exact same model! 👍"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Exercises"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 1. to 11."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "1. TensorFlow is an open-source library for numerical computation, particularly well suited and fine-tuned for large-scale Machine Learning. Its core is similar to NumPy, but it also features GPU support, support for distributed computing, computation graph analysis and optimization capabilities (with a portable graph format that allows you to train a TensorFlow model in one environment and run it in another), an optimization API based on reverse-mode autodiff, and several powerful APIs such as tf.keras, tf.data, tf.image, tf.signal, and more. Other popular Deep Learning libraries include PyTorch, MXNet, Microsoft Cognitive Toolkit, Theano, Caffe2, and Chainer.\n",
    "2. Although TensorFlow offers most of the functionalities provided by NumPy, it is not a drop-in replacement, for a few reasons. First, the names of the functions are not always the same (for example, `tf.reduce_sum()` versus `np.sum()`). Second, some functions do not behave in exactly the same way (for example, `tf.transpose()` creates a transposed copy of a tensor, while NumPy's `T` attribute creates a transposed view, without actually copying any data). Lastly, NumPy arrays are mutable, while TensorFlow tensors are not (but you can use a `tf.Variable` if you need a mutable object).\n",
    "3. Both `tf.range(10)` and `tf.constant(np.arange(10))` return a one-dimensional tensor containing the integers 0 to 9. However, the former uses 32-bit integers while the latter uses 64-bit integers. Indeed, TensorFlow defaults to 32 bits, while NumPy defaults to 64 bits.\n",
    "4. Beyond regular tensors, TensorFlow offers several other data structures, including sparse tensors, tensor arrays, ragged tensors, queues, string tensors, and sets. The last two are actually represented as regular tensors, but TensorFlow provides special functions to manipulate them (in `tf.strings` and `tf.sets`).\n",
    "5. When you want to define a custom loss function, in general you can just implement it as a regular Python function. However, if your custom loss function must support some hyperparameters (or any other state), then you should subclass the `keras.losses.Loss` class and implement the `__init__()` and `call()` methods. If you want the loss function's hyperparameters to be saved along with the model, then you must also implement the `get_config()` method.\n",
    "6. Much like custom loss functions, most metrics can be defined as regular Python functions. But if you want your custom metric to support some hyperparameters (or any other state), then you should subclass the `keras.metrics.Metric` class. Moreover, if computing the metric over a whole epoch is not equivalent to computing the mean metric over all batches in that epoch (e.g., as for the precision and recall metrics), then you should subclass the `keras.metrics.Metric` class and implement the `__init__()`, `update_state()`, and `result()` methods to keep track of a running metric during each epoch. You should also implement the `reset_state()` method (called `reset_states()` in older TensorFlow versions) unless all it needs to do is reset all variables to 0.0. If you want the state to be saved along with the model, then you should implement the `get_config()` method as well.\n",
    "7. You should distinguish the internal components of your model (i.e., layers or reusable blocks of layers) from the model itself (i.e., the object you will train). The former should subclass the `keras.layers.Layer` class, while the latter should subclass the `keras.models.Model` class.\n",
    "8. Writing your own custom training loop is fairly advanced, so you should only do it if you really need to. Keras provides several tools to customize training without having to write a custom training loop: callbacks, custom regularizers, custom constraints, custom losses, and so on. You should use these instead of writing a custom training loop whenever possible: writing a custom training loop is more error-prone, and it will be harder to reuse the custom code you write. However, in some cases writing a custom training loop is necessary⁠—for example, if you want to use different optimizers for different parts of your neural network, like in the [Wide & Deep paper](https://homl.info/widedeep). A custom training loop can also be useful when debugging, or when trying to understand exactly how training works.\n",
    "9. Custom Keras components should be convertible to TF Functions, which means they should stick to TF operations as much as possible and respect all the rules listed in Chapter 12 (in the _TF Function Rules_ section). If you absolutely need to include arbitrary Python code in a custom component, you can either wrap it in a `tf.py_function()` operation (but this will reduce performance and limit your model's portability) or set `dynamic=True` when creating the custom layer or model (or set `run_eagerly=True` when calling the model's `compile()` method).\n",
    "10. Please refer to Chapter 12 for the list of rules to respect when creating a TF Function (in the _TF Function Rules_ section).\n",
    "11. Creating a dynamic Keras model can be useful for debugging, as it will not compile any custom component to a TF Function, and you can use any Python debugger to debug your code. It can also be useful if you want to include arbitrary Python code in your model (or in your training code), including calls to external libraries. To make a model dynamic, you must set `dynamic=True` when creating it. Alternatively, you can set `run_eagerly=True` when calling the model's `compile()` method. Making a model dynamic prevents Keras from using any of TensorFlow's graph features, so it will slow down training and inference, and you will not have the possibility to export the computation graph, which will limit your model's portability."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 12. Implement a custom layer that performs _Layer Normalization_\n",
    "_We will use this type of layer in Chapter 15 when using Recurrent Neural Networks._"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### a.\n",
    "_Exercise: The `build()` method should define two trainable weights *α* and *β*, both of shape `input_shape[-1:]` and data type `tf.float32`. *α* should be initialized with 1s, and *β* with 0s._"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Solution: see below."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### b.\n",
    "_Exercise: The `call()` method should compute the mean_ μ _and standard deviation_ σ _of each instance's features. For this, you can use `tf.nn.moments(inputs, axes=-1, keepdims=True)`, which returns the mean μ and the variance σ<sup>2</sup> of all instances (compute the square root of the variance to get the standard deviation). Then the function should compute and return *α*⊗(*X* - μ)/(σ + ε) + *β*, where ⊗ represents itemwise multiplication (`*`) and ε is a smoothing term (small constant to avoid division by zero, e.g., 0.001)._"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 242,
   "metadata": {},
   "outputs": [],
   "source": [
    "class LayerNormalization(tf.keras.layers.Layer):\n",
    "    \"\"\"Custom layer normalization over the last axis of the inputs.\n",
    "\n",
    "    Each instance is standardized with the mean and variance of its own\n",
    "    features, then scaled by `alpha` and shifted by `beta` (one trainable\n",
    "    value per feature for each).\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(self, eps=0.001, **kwargs):\n",
    "        \"\"\"Store the smoothing term `eps`; other kwargs go to the base layer.\"\"\"\n",
    "        super().__init__(**kwargs)\n",
    "        self.eps = eps\n",
    "\n",
    "    def build(self, batch_input_shape):\n",
    "        \"\"\"Create `alpha` (ones) and `beta` (zeros), shaped like the last axis.\"\"\"\n",
    "        feature_shape = batch_input_shape[-1:]\n",
    "        # alpha is created before beta, so the layer's weights are [alpha, beta]\n",
    "        self.alpha = self.add_weight(name=\"alpha\", shape=feature_shape,\n",
    "                                     initializer=\"ones\")\n",
    "        self.beta = self.add_weight(name=\"beta\", shape=feature_shape,\n",
    "                                    initializer=\"zeros\")\n",
    "\n",
    "    def call(self, X):\n",
    "        \"\"\"Return alpha * (X - mean) / sqrt(variance + eps) + beta.\"\"\"\n",
    "        mean, variance = tf.nn.moments(X, axes=-1, keepdims=True)\n",
    "        # eps is added inside the square root, not to its result\n",
    "        std = tf.sqrt(variance + self.eps)\n",
    "        centered = X - mean\n",
    "        return self.alpha * centered / std + self.beta\n",
    "\n",
    "    def get_config(self):\n",
    "        \"\"\"Return the base layer config extended with `eps`.\"\"\"\n",
    "        return dict(super().get_config(), eps=self.eps)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Note that making _ε_ a hyperparameter (`eps`) was not compulsory. Also note that it's preferable to compute `tf.sqrt(variance + self.eps)` rather than `tf.sqrt(variance) + self.eps`. Indeed, the derivative of sqrt(z) is undefined when z=0, so training will bomb whenever the variance vector has at least one component equal to 0. Adding _ε_ within the square root guarantees that this will never happen."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### c.\n",
    "_Exercise: Ensure that your custom layer produces the same (or very nearly the same) output as the `tf.keras.layers.LayerNormalization` layer._"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Let's create one instance of each class, apply them to some data (e.g., the training set), and ensure that the difference is negligible."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 243,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=3.9782837e-08>"
      ]
     },
     "execution_count": 243,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "X = X_train.astype(np.float32)\n",
    "\n",
    "custom_layer_norm = LayerNormalization()\n",
    "keras_layer_norm = tf.keras.layers.LayerNormalization()\n",
    "\n",
    "tf.reduce_mean(tf.keras.losses.mean_absolute_error(\n",
    "    keras_layer_norm(X), custom_layer_norm(X)))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Yep, that's close enough. To be extra sure, let's make alpha and beta completely random and compare again:"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 244,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<tf.Tensor: shape=(), dtype=float32, numpy=1.764704e-08>"
      ]
     },
     "execution_count": 244,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tf.keras.utils.set_random_seed(42)\n",
    "random_alpha = np.random.rand(X.shape[-1])\n",
    "random_beta = np.random.rand(X.shape[-1])\n",
    "\n",
    "custom_layer_norm.set_weights([random_alpha, random_beta])\n",
    "keras_layer_norm.set_weights([random_alpha, random_beta])\n",
    "\n",
    "tf.reduce_mean(tf.keras.losses.mean_absolute_error(\n",
    "    keras_layer_norm(X), custom_layer_norm(X)))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Still a negligible difference! Our custom layer works fine."
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 13. Train a model using a custom training loop to tackle the Fashion MNIST dataset\n",
    "_The Fashion MNIST dataset was introduced in Chapter 10._"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### a.\n",
    "_Exercise: Display the epoch, iteration, mean training loss, and mean accuracy over each epoch (updated at each iteration), as well as the validation loss and accuracy at the end of each epoch._"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 245,
   "metadata": {},
   "outputs": [],
   "source": [
    "(X_train_full, y_train_full), (X_test, y_test) = tf.keras.datasets.fashion_mnist.load_data()\n",
    "X_train_full = X_train_full.astype(np.float32) / 255.\n",
    "X_valid, X_train = X_train_full[:5000], X_train_full[5000:]\n",
    "y_valid, y_train = y_train_full[:5000], y_train_full[5000:]\n",
    "X_test = X_test.astype(np.float32) / 255."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 246,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 247,
   "metadata": {},
   "outputs": [],
   "source": [
    "model = tf.keras.Sequential([\n",
    "    tf.keras.layers.Flatten(input_shape=[28, 28]),\n",
    "    tf.keras.layers.Dense(100, activation=\"relu\"),\n",
    "    tf.keras.layers.Dense(10, activation=\"softmax\"),\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 248,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_epochs = 5\n",
    "batch_size = 32\n",
    "n_steps = len(X_train) // batch_size\n",
    "optimizer = tf.keras.optimizers.Nadam(learning_rate=0.01)\n",
    "loss_fn = tf.keras.losses.sparse_categorical_crossentropy\n",
    "mean_loss = tf.keras.metrics.Mean()\n",
    "metrics = [tf.keras.metrics.SparseCategoricalAccuracy()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 249,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "a0c8a6efecb44efdbaf6f6f2107a37e6",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "All epochs:   0%|          | 0/5 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "ba37766cb41848b4ae0f544c8ddf238f",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 1/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "dc1d7d5c3f2148b1bb06e974bba09f52",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 2/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "a9fccf049df546079656b4fa4d53cf8a",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 3/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "e63ee530efcf46af907e7ee80bea8be0",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 4/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "a9bbff8ceb73461398293a4f5f1cade8",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 5/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Custom training loop: one outer progress bar for the epochs, and one\n",
    "# inner progress bar per epoch for the training steps.\n",
    "with trange(1, n_epochs + 1, desc=\"All epochs\") as epochs:\n",
    "    for epoch in epochs:\n",
    "        with trange(1, n_steps + 1, desc=f\"Epoch {epoch}/{n_epochs}\") as steps:\n",
    "            for step in steps:\n",
    "                X_batch, y_batch = random_batch(X_train, y_train)\n",
    "                with tf.GradientTape() as tape:\n",
    "                    y_pred = model(X_batch)\n",
    "                    main_loss = tf.reduce_mean(loss_fn(y_batch, y_pred))\n",
    "                    # total loss = main loss + any extra losses held by the model\n",
    "                    loss = tf.add_n([main_loss] + model.losses)\n",
    "                gradients = tape.gradient(loss, model.trainable_variables)\n",
    "                optimizer.apply_gradients(zip(gradients, model.trainable_variables))\n",
    "                # apply each variable's constraint, if it has one\n",
    "                for variable in model.variables:\n",
    "                    if variable.constraint is not None:\n",
    "                        variable.assign(variable.constraint(variable))\n",
    "                # running mean loss and metrics since the start of the epoch\n",
    "                status = OrderedDict()\n",
    "                mean_loss(loss)\n",
    "                status[\"loss\"] = mean_loss.result().numpy()\n",
    "                for metric in metrics:\n",
    "                    metric(y_batch, y_pred)\n",
    "                    status[metric.name] = metric.result().numpy()\n",
    "                steps.set_postfix(status)\n",
    "            # end of epoch: add the validation loss and accuracy to the status\n",
    "            y_pred = model(X_valid)\n",
    "            status[\"val_loss\"] = np.mean(loss_fn(y_valid, y_pred))\n",
    "            status[\"val_accuracy\"] = np.mean(tf.keras.metrics.sparse_categorical_accuracy(\n",
    "                tf.constant(y_valid, dtype=np.float32), y_pred))\n",
    "            steps.set_postfix(status)\n",
    "        # reset the running loss and metrics before the next epoch;\n",
    "        # reset_state() replaces the deprecated reset_states() alias\n",
    "        for metric in [mean_loss] + metrics:\n",
    "            metric.reset_state()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### b.\n",
    "_Exercise: Try using a different optimizer with a different learning rate for the upper layers and the lower layers._"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 250,
   "metadata": {},
   "outputs": [],
   "source": [
    "tf.keras.utils.set_random_seed(42)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 251,
   "metadata": {},
   "outputs": [],
   "source": [
    "lower_layers = tf.keras.Sequential([\n",
    "    tf.keras.layers.Flatten(input_shape=[28, 28]),\n",
    "    tf.keras.layers.Dense(100, activation=\"relu\"),\n",
    "])\n",
    "upper_layers = tf.keras.Sequential([\n",
    "    tf.keras.layers.Dense(10, activation=\"softmax\"),\n",
    "])\n",
    "model = tf.keras.Sequential([\n",
    "    lower_layers, upper_layers\n",
    "])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 252,
   "metadata": {},
   "outputs": [],
   "source": [
    "lower_optimizer = tf.keras.optimizers.SGD(learning_rate=1e-4)\n",
    "upper_optimizer = tf.keras.optimizers.Nadam(learning_rate=1e-3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 253,
   "metadata": {},
   "outputs": [],
   "source": [
    "n_epochs = 5\n",
    "batch_size = 32\n",
    "n_steps = len(X_train) // batch_size\n",
    "loss_fn = tf.keras.losses.sparse_categorical_crossentropy\n",
    "mean_loss = tf.keras.metrics.Mean()\n",
    "metrics = [tf.keras.metrics.SparseCategoricalAccuracy()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 254,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "5bdc4d309e3e4f03a27150634a0b89c3",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "All epochs:   0%|          | 0/5 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "b816337dd6ba4177a8bcdd41639a8930",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 1/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "b4cba66f77474d2b9f9de9a207eadf6c",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 2/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "5649fae110bf4f90bce00b39838e05bf",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 3/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "7cd99923c6cc43e78faf87b13be2df7b",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 4/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "39ad913b024f4a2bb31477cfb2d61fbf",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "Epoch 5/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Custom training loop using a separate optimizer for the lower and the\n",
    "# upper layers of the model.\n",
    "with trange(1, n_epochs + 1, desc=\"All epochs\") as epochs:\n",
    "    for epoch in epochs:\n",
    "        with trange(1, n_steps + 1, desc=f\"Epoch {epoch}/{n_epochs}\") as steps:\n",
    "            for step in steps:\n",
    "                X_batch, y_batch = random_batch(X_train, y_train)\n",
    "                # persistent=True because tape.gradient() is called twice below\n",
    "                # (once per group of layers)\n",
    "                with tf.GradientTape(persistent=True) as tape:\n",
    "                    y_pred = model(X_batch)\n",
    "                    main_loss = tf.reduce_mean(loss_fn(y_batch, y_pred))\n",
    "                    # total loss = main loss + any extra losses held by the model\n",
    "                    loss = tf.add_n([main_loss] + model.losses)\n",
    "                # each optimizer only updates the variables of its own layers\n",
    "                for layers, optimizer in ((lower_layers, lower_optimizer),\n",
    "                                          (upper_layers, upper_optimizer)):\n",
    "                    gradients = tape.gradient(loss, layers.trainable_variables)\n",
    "                    optimizer.apply_gradients(zip(gradients, layers.trainable_variables))\n",
    "                del tape  # drop the persistent tape now that both gradients are computed\n",
    "                # apply each variable's constraint, if it has one\n",
    "                for variable in model.variables:\n",
    "                    if variable.constraint is not None:\n",
    "                        variable.assign(variable.constraint(variable))\n",
    "                # running mean loss and metrics since the start of the epoch\n",
    "                status = OrderedDict()\n",
    "                mean_loss(loss)\n",
    "                status[\"loss\"] = mean_loss.result().numpy()\n",
    "                for metric in metrics:\n",
    "                    metric(y_batch, y_pred)\n",
    "                    status[metric.name] = metric.result().numpy()\n",
    "                steps.set_postfix(status)\n",
    "            # end of epoch: add the validation loss and accuracy to the status\n",
    "            y_pred = model(X_valid)\n",
    "            status[\"val_loss\"] = np.mean(loss_fn(y_valid, y_pred))\n",
    "            status[\"val_accuracy\"] = np.mean(tf.keras.metrics.sparse_categorical_accuracy(\n",
    "                tf.constant(y_valid, dtype=np.float32), y_pred))\n",
    "            steps.set_postfix(status)\n",
    "        # reset the running loss and metrics before the next epoch;\n",
    "        # reset_state() replaces the deprecated reset_states() alias\n",
    "        for metric in [mean_loss] + metrics:\n",
    "            metric.reset_state()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.6"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								{
 								 "cells": [
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "**Chapter 12 – Custom Models and Training with TensorFlow**"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "_This notebook contains all the sample code and solutions to the exercises in chapter 12, as well as code examples from Appendix C_"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "<table align=\"left\">\n",
 								    "  <td>\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    <a href=\"https://colab.research.google.com/github/ageron/handson-ml3/blob/main/12_custom_models_and_training_with_tensorflow.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>\n",
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								    "  </td>\n",
-												Update 12_custom_models_and_training_with_tensorflow.ipynb

add Open in Kaggle badge
											
										
										
											2021-05-25 05:08:03 +02:00
+								    "  <td>\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    <a target=\"_blank\" href=\"https://kaggle.com/kernels/welcome?src=https://github.com/ageron/handson-ml3/blob/main/12_custom_models_and_training_with_tensorflow.ipynb\"><img src=\"https://kaggle.com/static/images/open-in-kaggle.svg\" /></a>\n",
-												Update 12_custom_models_and_training_with_tensorflow.ipynb

add Open in Kaggle badge
											
										
										
											2021-05-25 05:08:03 +02:00
+								    "  </td>\n",
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								    "</table>"
 								   ]
 								  },
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								  {
 								   "cell_type": "markdown",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "metadata": {
 								    "tags": []
 								   },
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "# Setup"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Require Python 3.7+

											
										
										
											2022-02-19 11:03:20 +01:00
+								    "This project requires Python 3.7 or above:"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 1,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "import sys\n",
 								    "\n",
-												Require Python 3.7+

											
										
										
											2022-02-19 11:03:20 +01:00
+								    "assert sys.version_info >= (3, 7)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Upgrade to TensorFlow 2.8

											
										
										
											2022-02-28 23:41:27 +01:00
+								    "And TensorFlow ≥ 2.8:"
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 2,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Update lib versions and add pydot, fixes #29

											
										
										
											2022-09-22 09:14:01 +02:00
+								    "from packaging import version\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "import tensorflow as tf\n",
 								    "\n",
-												Update lib versions and add pydot, fixes #29

											
										
										
											2022-09-22 09:14:01 +02:00
+								    "assert version.parse(tf.__version__) >= version.parse(\"2.8.0\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "## Using TensorFlow like NumPy"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "### Tensors and Operations"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "#### Tensors"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 3,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 3), dtype=float32, numpy=\n",
 								       "array([[1., 2., 3.],\n",
 								       "       [4., 5., 6.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 3,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "t = tf.constant([[1., 2., 3.], [4., 5., 6.]]) # matrix\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "t"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 4,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "TensorShape([2, 3])"
 								      ]
 								     },
 								     "execution_count": 4,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "t.shape"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 5,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "tf.float32"
 								      ]
 								     },
 								     "execution_count": 5,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "t.dtype"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "#### Indexing"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 6,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
 								       "array([[2., 3.],\n",
 								       "       [5., 6.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 6,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "t[:, 1:]"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 7,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 1), dtype=float32, numpy=\n",
 								       "array([[2.],\n",
 								       "       [5.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 7,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "t[..., 1, tf.newaxis]"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "#### Ops"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 8,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 3), dtype=float32, numpy=\n",
 								       "array([[11., 12., 13.],\n",
 								       "       [14., 15., 16.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 8,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "t + 10"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 9,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 3), dtype=float32, numpy=\n",
 								       "array([[ 1.,  4.,  9.],\n",
 								       "       [16., 25., 36.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 9,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "tf.square(t)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 10,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
 								       "array([[14., 32.],\n",
 								       "       [32., 77.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 10,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "t @ tf.transpose(t)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "#### Scalars"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 11,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=42>"
 								      ]
 								     },
 								     "execution_count": 11,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "tf.constant(42)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "#### Keras's low-level API"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "You may still run across code that uses Keras's low-level API:"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 12,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
 								       "array([[11., 26.],\n",
 								       "       [14., 35.],\n",
 								       "       [19., 46.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 12,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "K = tf.keras.backend\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "K.square(K.transpose(t)) + 10"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "But since Keras does not support multiple backends anymore, you should instead use TF's low-level API directly:"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 13,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
 								       "array([[11., 26.],\n",
 								       "       [14., 35.],\n",
 								       "       [19., 46.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 13,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.square(tf.transpose(t)) + 10"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### Tensors and NumPy"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 14,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3,), dtype=float64, numpy=array([2., 4., 5.])>"
 								      ]
 								     },
 								     "execution_count": 14,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "import numpy as np\n",
 								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "a = np.array([2., 4., 5.])\n",
 								    "tf.constant(a)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 15,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "array([[1., 2., 3.],\n",
 								       "       [4., 5., 6.]], dtype=float32)"
 								      ]
 								     },
 								     "execution_count": 15,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "t.numpy()"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 16,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "array([[1., 2., 3.],\n",
 								       "       [4., 5., 6.]], dtype=float32)"
 								      ]
 								     },
 								     "execution_count": 16,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "np.array(t)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 17,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3,), dtype=float64, numpy=array([ 4., 16., 25.])>"
 								      ]
 								     },
 								     "execution_count": 17,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "tf.square(a)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 18,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "array([[ 1.,  4.,  9.],\n",
 								       "       [16., 25., 36.]], dtype=float32)"
 								      ]
 								     },
 								     "execution_count": 18,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "np.square(t)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "### Type Conversions"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 19,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "cannot compute AddV2 as input #1(zero-based) was expected to be a float tensor but is a int32 tensor [Op:AddV2] name: \n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "try:\n",
 								    "    tf.constant(2.0) + tf.constant(40)\n",
 								    "except tf.errors.InvalidArgumentError as ex:\n",
 								    "    print(ex)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 20,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "cannot compute AddV2 as input #1(zero-based) was expected to be a float tensor but is a double tensor [Op:AddV2] name: \n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "try:\n",
 								    "    tf.constant(2.0) + tf.constant(40., dtype=tf.float64)\n",
 								    "except tf.errors.InvalidArgumentError as ex:\n",
 								    "    print(ex)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 21,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=42.0>"
 								      ]
 								     },
 								     "execution_count": 21,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "t2 = tf.constant(40., dtype=tf.float64)\n",
 								    "tf.constant(2.0) + tf.cast(t2, tf.float32)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "### Variables"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 22,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Variable 'Variable:0' shape=(2, 3) dtype=float32, numpy=\n",
 								       "array([[1., 2., 3.],\n",
 								       "       [4., 5., 6.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 22,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "v = tf.Variable([[1., 2., 3.], [4., 5., 6.]])\n",
 								    "v"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 23,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
 								       "array([[ 2.,  4.,  6.],\n",
 								       "       [ 8., 10., 12.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 23,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "v.assign(2 * v)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 24,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
 								       "array([[ 2., 42.,  6.],\n",
 								       "       [ 8., 10., 12.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 24,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "v[0, 1].assign(42)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 25,
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "metadata": {
 								    "tags": []
 								   },
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
 								       "array([[ 2., 42.,  0.],\n",
 								       "       [ 8., 10.,  1.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 25,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "v[:, 2].assign([0., 1.])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 26,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
 								       "array([[100.,  42.,   0.],\n",
 								       "       [  8.,  10., 200.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 26,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "v.scatter_nd_update(\n",
 								    "    indices=[[0, 0], [1, 2]], updates=[100., 200.])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 27,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Variable 'UnreadVariable' shape=(2, 3) dtype=float32, numpy=\n",
 								       "array([[4., 5., 6.],\n",
 								       "       [1., 2., 3.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 27,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows how to use scatter_update()\n",
 								    "sparse_delta = tf.IndexedSlices(values=[[1., 2., 3.], [4., 5., 6.]],\n",
 								    "                                indices=[1, 0])\n",
 								    "v.scatter_update(sparse_delta)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 28,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "'ResourceVariable' object does not support item assignment\n"
 								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "try:\n",
 								    "    v[1] = [7., 8., 9.]\n",
 								    "except TypeError as ex:\n",
 								    "    print(ex)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "### Strings"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "The code in this section and all the following sections is in Appendix C."
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 29,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=string, numpy=b'hello world'>"
 								      ]
 								     },
 								     "execution_count": 29,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "tf.constant(b\"hello world\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 30,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=string, numpy=b'caf\\xc3\\xa9'>"
 								      ]
 								     },
 								     "execution_count": 30,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.constant(\"café\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 31,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([ 99,  97, 102, 233], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 31,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "u = tf.constant([ord(c) for c in \"café\"])\n",
 								    "u"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 32,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=4>"
 								      ]
 								     },
 								     "execution_count": 32,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "b = tf.strings.unicode_encode(u, \"UTF-8\")\n",
 								    "tf.strings.length(b, unit=\"UTF8_CHAR\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 33,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([ 99,  97, 102, 233], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 33,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.strings.unicode_decode(b, \"UTF-8\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### Other Data Structures"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "The code in this section is in Appendix C."
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "#### String arrays"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 34,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=string, numpy=b'hello world'>"
 								      ]
 								     },
 								     "execution_count": 34,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.constant(b\"hello world\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "code",
 								   "execution_count": 35,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=string, numpy=b'caf\\xc3\\xa9'>"
 								      ]
 								     },
 								     "execution_count": 35,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.constant(\"café\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 36,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([ 99,  97, 102, 233], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 36,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "u = tf.constant([ord(c) for c in \"café\"])\n",
 								    "u"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 37,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=string, numpy=b'caf\\xc3\\xa9'>"
 								      ]
 								     },
 								     "execution_count": 37,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "b = tf.strings.unicode_encode(u, \"UTF-8\")\n",
 								    "b"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 38,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=4>"
 								      ]
 								     },
 								     "execution_count": 38,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.strings.length(b, unit=\"UTF8_CHAR\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 39,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([ 99,  97, 102, 233], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 39,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.strings.unicode_decode(b, \"UTF-8\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 40,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "p = tf.constant([\"Café\", \"Coffee\", \"caffè\", \"咖啡\"])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 41,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(4,), dtype=int32, numpy=array([4, 6, 5, 2], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 41,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.strings.length(p, unit=\"UTF8_CHAR\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 42,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<tf.RaggedTensor [[67, 97, 102, 233], [67, 111, 102, 102, 101, 101],\n",
 								       " [99, 97, 102, 102, 232], [21654, 21857]]>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 42,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "r = tf.strings.unicode_decode(p, \"UTF8\")\n",
 								    "r"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "#### Ragged tensors"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 43,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(6,), dtype=int32, numpy=array([ 67, 111, 102, 102, 101, 101], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 43,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "r[1]"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "code",
 								   "execution_count": 44,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.RaggedTensor [[67, 111, 102, 102, 101, 101], [99, 97, 102, 102, 232]]>"
 								      ]
 								     },
 								     "execution_count": 44,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "r[1:3]  # extra code – a slice of a ragged tensor is a ragged tensor"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 45,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<tf.RaggedTensor [[67, 97, 102, 233], [67, 111, 102, 102, 101, 101],\n",
 								       " [99, 97, 102, 102, 232], [21654, 21857], [65, 66], [], [67]]>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 45,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "r2 = tf.ragged.constant([[65, 66], [], [67]])\n",
 								    "tf.concat([r, r2], axis=0)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 46,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "<tf.RaggedTensor [[67, 97, 102, 233, 68, 69, 70], [67, 111, 102, 102, 101, 101, 71],\n",
 								      " [99, 97, 102, 102, 232], [21654, 21857, 72, 73]]>\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "r3 = tf.ragged.constant([[68, 69, 70], [71], [], [72, 73]])\n",
 								    "print(tf.concat([r, r3], axis=1))"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 47,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(4, 6), dtype=int32, numpy=\n",
 								       "array([[   67,    97,   102,   233,     0,     0],\n",
 								       "       [   67,   111,   102,   102,   101,   101],\n",
 								       "       [   99,    97,   102,   102,   232,     0],\n",
 								       "       [21654, 21857,     0,     0,     0,     0]], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 47,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "r.to_tensor()"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "#### Sparse tensors"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 48,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "s = tf.SparseTensor(indices=[[0, 1], [1, 0], [2, 3]],\n",
 								    "                    values=[1., 2., 3.],\n",
 								    "                    dense_shape=[3, 4])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 49,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3, 4), dtype=float32, numpy=\n",
 								       "array([[0., 1., 0., 0.],\n",
 								       "       [2., 0., 0., 0.],\n",
 								       "       [0., 0., 0., 3.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 49,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.sparse.to_dense(s)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 50,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "SparseTensor(indices=tf.Tensor(\n",
 								       "[[0 1]\n",
 								       " [1 0]\n",
 								       " [2 3]], shape=(3, 2), dtype=int64), values=tf.Tensor([ 42.  84. 126.], shape=(3,), dtype=float32), dense_shape=tf.Tensor([3 4], shape=(2,), dtype=int64))"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 50,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "s * 42.0"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 51,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "unsupported operand type(s) for +: 'SparseTensor' and 'float'\n"
 								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "try:\n",
 								    "    s + 42.0\n",
 								    "except TypeError as ex:\n",
 								    "    print(ex)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 52,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
 								       "array([[ 30.,  40.],\n",
 								       "       [ 20.,  40.],\n",
 								       "       [210., 240.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 52,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows how to multiply a sparse tensor and a dense tensor\n",
 								    "s4 = tf.constant([[10., 20.], [30., 40.], [50., 60.], [70., 80.]])\n",
 								    "tf.sparse.sparse_dense_matmul(s, s4)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 53,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "{{function_node __wrapped__SparseToDense_device_/job:localhost/replica:0/task:0/device:CPU:0}} indices[1] = [0,1] is out of order. Many sparse ops require sorted indices.\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "    Use `tf.sparse.reorder` to create a correctly ordered copy.\n",
 								      "\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      " [Op:SparseToDense] name: \n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "2023-09-05 11:03:52.814492: W tensorflow/core/framework/op_kernel.cc:1828] OP_REQUIRES failed at sparse_to_dense_op.cc:161 : INVALID_ARGUMENT: indices[1] = [0,1] is out of order. Many sparse ops require sorted indices.\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "    Use `tf.sparse.reorder` to create a correctly ordered copy.\n",
 								      "\n",
 								      "\n"
 								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – when creating a sparse tensor, values must be given in \"reading\n",
 								    "#              order\", or else `to_dense()` will fail.\n",
 								    "s5 = tf.SparseTensor(indices=[[0, 2], [0, 1]],  # WRONG ORDER!\n",
 								    "                     values=[1., 2.],\n",
 								    "                     dense_shape=[3, 4])\n",
 								    "try:\n",
 								    "    tf.sparse.to_dense(s5)\n",
 								    "except tf.errors.InvalidArgumentError as ex:\n",
 								    "    print(ex)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 54,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3, 4), dtype=float32, numpy=\n",
 								       "array([[0., 2., 1., 0.],\n",
 								       "       [0., 0., 0., 0.],\n",
 								       "       [0., 0., 0., 0.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 54,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows how to fix the sparse tensor s5 by reordering its values\n",
 								    "s6 = tf.sparse.reorder(s5)\n",
 								    "tf.sparse.to_dense(s6)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "#### Tensor Arrays"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 55,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "array = tf.TensorArray(dtype=tf.float32, size=3)\n",
 								    "array = array.write(0, tf.constant([1., 2.]))\n",
 								    "array = array.write(1, tf.constant([3., 10.]))\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "array = array.write(2, tf.constant([5., 7.]))\n",
 								    "tensor1 = array.read(1)  # returns (and zeros out!) tf.constant([3., 10.])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 56,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
 								       "array([[1., 2.],\n",
 								       "       [0., 0.],\n",
 								       "       [5., 7.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 56,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "array.stack()"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 57,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
 								       "array([[ 1.,  2.],\n",
 								       "       [ 3., 10.],\n",
 								       "       [ 5.,  7.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 57,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows how to disable clear_after_read\n",
 								    "array2 = tf.TensorArray(dtype=tf.float32, size=3, clear_after_read=False)\n",
 								    "array2 = array2.write(0, tf.constant([1., 2.]))\n",
 								    "array2 = array2.write(1, tf.constant([3., 10.]))\n",
 								    "array2 = array2.write(2, tf.constant([5., 7.]))\n",
 								    "tensor2 = array2.read(1)  # returns tf.constant([3., 10.])\n",
 								    "array2.stack()"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 58,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3, 2), dtype=float32, numpy=\n",
 								       "array([[1., 2.],\n",
 								       "       [0., 0.],\n",
 								       "       [5., 7.]], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 58,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows how to create and use a tensor array with a dynamic size\n",
 								    "array3 = tf.TensorArray(dtype=tf.float32, size=0, dynamic_size=True)\n",
 								    "array3 = array3.write(0, tf.constant([1., 2.]))\n",
 								    "array3 = array3.write(1, tf.constant([3., 10.]))\n",
 								    "array3 = array3.write(2, tf.constant([5., 7.]))\n",
 								    "tensor3 = array3.read(1)\n",
 								    "array3.stack()"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "#### Sets"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 59,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "SparseTensor(indices=tf.Tensor(\n",
 								       "[[0 0]\n",
 								       " [0 1]\n",
 								       " [0 2]\n",
 								       " [0 3]\n",
 								       " [0 4]], shape=(5, 2), dtype=int64), values=tf.Tensor([ 1  5  6  9 11], shape=(5,), dtype=int32), dense_shape=tf.Tensor([1 5], shape=(2,), dtype=int64))"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 59,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "a = tf.constant([[1, 5, 9]])\n",
 								    "b = tf.constant([[5, 6, 9, 11]])\n",
 								    "u = tf.sets.union(a, b)\n",
 								    "u"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "code",
 								   "execution_count": 60,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(1, 5), dtype=int32, numpy=array([[ 1,  5,  6,  9, 11]], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 60,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.sparse.to_dense(u)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 61,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 5), dtype=int32, numpy=\n",
 								       "array([[ 1,  5,  6,  9, 11],\n",
 								       "       [ 0, 10, 13,  0,  0]], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 61,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "a = tf.constant([[1, 5, 9], [10, 0, 0]])\n",
 								    "b = tf.constant([[5, 6, 9, 11], [13, 0, 0, 0]])\n",
 								    "u = tf.sets.union(a, b)\n",
 								    "tf.sparse.to_dense(u)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 62,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 5), dtype=int32, numpy=\n",
 								       "array([[ 1,  5,  6,  9, 11],\n",
 								       "       [-1, 10, 13, -1, -1]], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 62,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "# extra code – shows how to use a different default value: -1 in this case\n",
 								    "a = tf.constant([[1, 5, 9], [10, -1, -1]])\n",
 								    "b = tf.constant([[5, 6, 9, 11], [13, -1, -1, -1]])\n",
 								    "u = tf.sets.union(a, b)\n",
 								    "tf.sparse.to_dense(u, default_value=-1)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 63,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 3), dtype=int32, numpy=\n",
 								       "array([[2, 3, 7],\n",
 								       "       [7, 0, 0]], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 63,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "# extra code – shows how to use `tf.sets.difference()`\n",
 								    "set1 = tf.constant([[2, 3, 5, 7], [7, 9, 0, 0]])\n",
 								    "set2 = tf.constant([[4, 5, 6], [9, 10, 0]])\n",
 								    "tf.sparse.to_dense(tf.sets.difference(set1, set2))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 64,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(2, 2), dtype=int32, numpy=\n",
 								       "array([[5, 0],\n",
 								       "       [0, 9]], dtype=int32)>"
 								      ]
 								     },
 								     "execution_count": 64,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "# extra code – shows how to use `tf.sets.intersection()`\n",
 								    "tf.sparse.to_dense(tf.sets.intersection(set1, set2))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 65,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(1,), dtype=bool, numpy=array([ True])>"
 								      ]
 								     },
 								     "execution_count": 65,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "# extra code – check whether set1[0] contains 5\n",
 								    "tf.sets.size(tf.sets.intersection(set1[:1], tf.constant([[5, 0, 0, 0]]))) > 0"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "#### Queues"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 66,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=2>"
 								      ]
 								     },
 								     "execution_count": 66,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "q = tf.queue.FIFOQueue(3, [tf.int32, tf.string], shapes=[(), ()])\n",
 								    "q.enqueue([10, b\"windy\"])\n",
 								    "q.enqueue([15, b\"sunny\"])\n",
 								    "q.size()"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 67,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor: shape=(), dtype=int32, numpy=10>,\n",
 								       " <tf.Tensor: shape=(), dtype=string, numpy=b'windy'>]"
 								      ]
 								     },
 								     "execution_count": 67,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "q.dequeue()"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 68,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "q.enqueue_many([[13, 16], [b'cloudy', b'rainy']])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 69,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor: shape=(3,), dtype=int32, numpy=array([15, 13, 16], dtype=int32)>,\n",
 								       " <tf.Tensor: shape=(3,), dtype=string, numpy=array([b'sunny', b'cloudy', b'rainy'], dtype=object)>]"
 								      ]
 								     },
 								     "execution_count": 69,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "q.dequeue_many(3)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "## Custom loss function"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 70,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "def huber_fn(y_true, y_pred):\n",
 								    "    error = y_true - y_pred\n",
 								    "    is_small_error = tf.abs(error) < 1\n",
 								    "    squared_loss = tf.square(error) / 2\n",
 								    "    linear_loss  = tf.abs(error) - 0.5\n",
 								    "    return tf.where(is_small_error, squared_loss, linear_loss)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 71,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAqQAAAFkCAYAAAD2RimAAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjUuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/NK7nSAAAACXBIWXMAAA9hAAAPYQGoP6dpAAB5/UlEQVR4nO3dd1xV5R/A8c9lg4IbRQVn7hmWYu49Mi3LmaOyX+YoMzNRK83VMHPkzJWaq9w5McW9cKSZmeZWECcoMi5wfn88XRAB5V7GuRe+79eLl5zDPfd+eTzc+z3PeZ7vY9A0TUMIIYQQQgid2OkdgBBCCCGEyNkkIRVCCCGEELqShFQIIYQQQuhKElIhhBBCCKErSUiFEEIIIYSuJCEVQgghhBC6koRUCCGEEELoShJSIYQQQgihK0lIhRBCCCGEriQhFUKIVIwaNQqDwUBgYKDeoSTTqFEjDAaD3mEIIUSGkIRUCGFTLl26hMFgoFWrVqk+5uDBgxgMBnr37p11gQkhhLCYJKRCCCGEEEJXkpAKIYQQQghdSUIqhMgxSpYsScmSJVP82bPGZP74449UrlwZFxcXfHx88Pf3JyoqKsXHnjx5ki5duuDl5YWTkxMlSpRg4MCB3LlzJ8njTMMPevfuzd9//81rr71GwYIFMRgMXLp0yaLfMTY2lu+//57q1avj6upKnjx5aNy4MRs3bkz22Pj4eObOncuLL75I/vz5cXNzo2TJknTo0IHdu3cneeyqVato2LAhnp6euLi44O3tTatWrVi7dq1FcQohxOMc9A5ACCGs3XfffUdgYCCdO3fm5ZdfZtOmTXz11VccP36czZs3J0lk169fT6dOnbC3t+eVV17B29ubv/76ix9++IGtW7dy6NAh8uXLl+T5z58/T506dahcuTK9evXi7t27ODk5mR2npml07tyZ1atXU65cOfr3709ERAQrV67k5ZdfZsqUKXzwwQcJj/f39+ebb76hTJkydOvWDXd3d65fv86ePXvYsWMHDRo0AGDmzJn069cPLy8vXn31VQoUKEBwcDCHDx9m7dq1dOjQwbKGFUKI/0hCKoSwSefPn2fUqFEp/uzatWsZ+lrbt28nKCiIypUrAzBu3DjatGnD1q1bWbJkCT169ADgzp079OjRg0KFCrFv3z58fHwSnmPZsmV069aNzz//nGnTpiV5/n379vHZZ5/x5ZdfpivOJUuWsHr1aho2bMi2bdsSktoRI0bg6+vLkCFDaNeuHaVKlQJg7ty5FCtWjJMnT+Lm5pbwPJqmce/evYTtuXPn4uTkxB9//EGhQoWSvOaTvb5CCGEJSUiFEDbp33//ZfTo0VnyWj169EhIRgEcHBwYP348AQEB/PTTTwkJ6aJFiwgPD2f69OlJklGArl27MnHiRJYvX54sIS1SpAgjR45Md5wLFy4E4JtvvknSw1q8eHE++ugj/P39+fnnn5O8lpOTEw4OST8KDAYD+fPnT7LP0dERR0fHZK9ZoECBdMcthBCSkAohbFLLli3ZsmVLij87ePAgfn5+GfZa9evXT7avVq1auLq6cuLEiSSva/r3/PnzyY6Jiori9u3b3L59m4IFCybsr169ukW36J90/PhxXF1defHFF5P9rFGjRgBJ4u3UqROzZs2iSpUqdO7cmYYNG+Ln50euXLmSHNupUyeGDRtGlSpV6NKlC40aNaJevXrkzZs33TELIQRIQiqEEM/k6emZ6v7r168nbN+9exeA6dOnP/X5IiIikiSkhQsXzoAoITw8HG9v7xR/VqRIEQDCwsIS9k2dOpXSpUuzcOFCxo4dy9ixY3FxcaFTp0589913CTEOHTqUAgUKMGvWLCZNmsR3332Hg4MDbdq0YfLkyQlDAIQQwlIyy14IkWPY2dkRGxub4s8eT9SeFBoamur+PHnyJGx7eHgAcOrUKTRNS/WrRIkSSZ4no1Zc8vDw4ObNmyn+zLTfFCO
o2/CffPIJp0+f5vr16yxdupT69euzaNEiunfvniS+Pn36EBQUxK1bt1izZg2vvfYa69evp23btsTFxWVI/EKInEsSUiFEjpEvXz5CQ0OTJaURERGcO3cu1eP27NmTbF9QUBCRkZHUqFEjYV/t2rUBOHDgQMYEbKaaNWsSGRnJ4cOHk/1s165dAEnifVzRokXp2rUrW7Zs4bnnnmP79u1ERkYme1yBAgXo0KEDK1asoEmTJpw5cybF4QlCCGEOSUiFEDlGrVq1MBqN/Pzzzwn7NE3D39+fiIiIVI9bvHgxp0+fTtiOjY1l+PDhAPTq1Sth/1tvvYW7uzsjRoxI8niTR48eJYwzzQymWPz9/TEajQn7r1+/zqRJk3BwcEjo+YyOjmbHjh1ompbkOSIiInjw4AGOjo7Y29sDsHXr1mRJvNFoTBii4Orqmmm/kxAiZ5AxpEKIHGPAgAEsWLCAPn36EBAQQKFChdizZw/379+nevXq/PHHHyke16xZM+rUqUOXLl3Inz8/mzZt4s8//6Rly5a8+eabCY8rVKgQy5Yt44033qB69eq0atWKChUqEBUVxeXLl9m1axd169ZNdTJWevXo0YPVq1ezbt06qlWrxssvv5xQh/TOnTt89913lC5dGoDIyEiaNm1K6dKlqV27Nj4+Pjx8+JDffvuNkJAQPv3004SJVp07d8bNzY169epRokQJjEYjAQEB/PXXX3Tu3DlZRQEhhDCXJKRCiByjatWqbNmyheHDh/Prr7+SO3du2rRpw7fffkvnzp1TPe7jjz+mXbt2TJkyhX///ZdChQoxbNgwPv/882TjP9u2bcvx48f59ttv2b59OwEBAeTKlYvixYvz1ltvJUlgM5rBYODXX39lypQp/PTTT0ybNg0nJyeef/55Bg8ezCuvvJLw2Fy5cvH111/z+++/s2fPHkJDQ8mXLx8VKlTg66+/TtIeEyZMYMuWLRw+fJgNGzaQK1cuypYty+zZs3n77bcz7fcRQuQcBu3J+zVCCCGEEEJkIRlDKoQQQgghdCUJqRBCCCGE0JUkpEIIIYQQQlfpSkgnTJiAwWBg0KBBT33crl278PX1xcXFhdKlSzNr1qz0vKwQQgghhMhGLE5Ijxw5wpw5c6hWrdpTH3fx4kXatGlD/fr1OX78OMOHD+eDDz5g1apVlr60EEIIIYTIRixKSB8+fEj37t358ccfyZcv31MfO2vWLHx8fJg8eTIVK1akT58+vP3220ycONGigIUQQgghRPZiUR3S/v3707ZtW5o1a8bYsWOf+tgDBw7QokWLJPtatmzJvHnzMBqNODo6JjsmOjqa6OjohO34+Hju3r1LgQIFMmzNZyGEEEIIkXE0TePBgwcULVoUOzvz+jzNTkiXL1/OsWPHOHLkSJoeHxISQuHChZPsK1y4MLGxsdy+fRsvL69kx0yYMIHRo0ebG5oQQgghhNDZ1atXKV68uFnHmJWQXr16lQ8//JBt27bh4uKS5uOe7NU01eJPrbfT39+fwYMHJ2yHhYXh4+PDP//8Q/78+c0JOccyGo3s3LmTxo0bp9gLnRq7WbPQPD3RXnstE6OzXpa2W04mbWa+iIgISpQoAcC///5Lnjx5dI7INsi5Zpmc3G6Ggwexb9eO2O3boXr1NB+Xk9ssPe7evUu5cuVwd3c3+1izEtKjR48SGhqKr69vwr64uDh2797NDz/8QHR0NPb29kmOKVKkCCEhIUn2hYaG4uDgQIECBVJ8HWdnZ5ydnZPtz58/f6rHiKSMRiNubm4UKFDAvD+mESMyLygbYHG75WDSZuZ7/II+f/785M2bV79gbIica5bJ0e3WsCH89BM0agRm3ELO0W2WASwZXmlWQtq0aVNOnTqVZN9bb71FhQoV+PTTT5MlowB+fn5s2LAhyb5t27ZRq1Yt+U+2VhcvwubN0K+f3pEIIYQQlsudG3r00DsKkQZmjTh1d3enSpUqSb5y5cpFgQIFqFKlCqBut/fs2TP
hmL59+3L58mUGDx7MmTNnmD9/PvPmzWPIkCEZ+5uIjHPwIHz+Ody9q3ckQgghhGVmzoRRo/SOQqRRhq/UFBwczJUrVxK2S5UqxaZNmwg
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<Figure size 800x350 with 1 Axes>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								     "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     "output_type": "display_data"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows what the Huber loss looks like\n",
 								    "\n",
 								    "import matplotlib.pyplot as plt\n",
 								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "plt.figure(figsize=(8, 3.5))\n",
 								    "z = np.linspace(-4, 4, 200)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "z_center = np.linspace(-1, 1, 200)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "plt.plot(z, huber_fn(0, z), \"b-\", linewidth=2, label=\"huber($z$)\")\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "plt.plot(z, z ** 2 / 2, \"r:\", linewidth=1)\n",
 								    "plt.plot(z_center, z_center ** 2 / 2, \"r\", linewidth=2)\n",
 								    "plt.plot([-1, -1], [0, huber_fn(0., -1.)], \"k--\")\n",
 								    "plt.plot([1, 1], [0, huber_fn(0., 1.)], \"k--\")\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "plt.gca().axhline(y=0, color='k')\n",
 								    "plt.gca().axvline(x=0, color='k')\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "plt.text(2.1, 3.5, r\"$\\frac{1}{2}z^2$\", color=\"r\", fontsize=15)\n",
 								    "plt.text(3.0, 2.2, r\"$|z| - \\frac{1}{2}$\", color=\"b\", fontsize=15)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "plt.axis([-4, 4, 0, 4])\n",
 								    "plt.grid(True)\n",
 								    "plt.xlabel(\"$z$\")\n",
 								    "plt.legend(fontsize=14)\n",
 								    "plt.title(\"Huber loss\", fontsize=14)\n",
 								    "plt.show()"
 								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "To test our custom loss function, let's create a basic Keras model and train it on the California housing dataset:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 72,
 								   "metadata": {
 								    "tags": []
 								   },
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – loads, splits and scales the California housing dataset, then\n",
 								    "#              creates a simple Keras model\n",
 								    "\n",
 								    "from sklearn.datasets import fetch_california_housing\n",
 								    "from sklearn.model_selection import train_test_split\n",
 								    "from sklearn.preprocessing import StandardScaler\n",
 								    "\n",
 								    "housing = fetch_california_housing()\n",
 								    "X_train_full, X_test, y_train_full, y_test = train_test_split(\n",
 								    "    housing.data, housing.target.reshape(-1, 1), random_state=42)\n",
 								    "X_train, X_valid, y_train, y_valid = train_test_split(\n",
 								    "    X_train_full, y_train_full, random_state=42)\n",
 								    "\n",
 								    "scaler = StandardScaler()\n",
 								    "X_train_scaled = scaler.fit_transform(X_train)\n",
 								    "X_valid_scaled = scaler.transform(X_valid)\n",
 								    "X_test_scaled = scaler.transform(X_test)\n",
 								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "input_shape = X_train.shape[1:]\n",
 								    "\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
 								    "                          input_shape=input_shape),\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "    tf.keras.layers.Dense(1),\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 73,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "model.compile(loss=huber_fn, optimizer=\"nadam\", metrics=[\"mae\"])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 74,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {
 								    "scrolled": true
 								   },
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.4858 - mae: 0.8357 - val_loss: 0.3479 - val_mae: 0.6527\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.2415 - mae: 0.5419 - val_loss: 0.2630 - val_mae: 0.5473\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19a5004c0>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 74,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "## Saving/Loading Models with Custom Objects"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 75,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss/assets\n"
 								     ]
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss/assets\n"
 								     ]
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.save(\"my_model_with_a_custom_loss\")  # extra code – saving works fine"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 76,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model = tf.keras.models.load_model(\"my_model_with_a_custom_loss\",\n",
 								    "                                   custom_objects={\"huber_fn\": huber_fn})"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 77,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.2052 - mae: 0.4910 - val_loss: 0.2210 - val_mae: 0.4946\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.1888 - mae: 0.4683 - val_loss: 0.2021 - val_mae: 0.4773\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19a876dd0>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 77,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 78,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "def create_huber(threshold=1.0):\n",
 								    "    def huber_fn(y_true, y_pred):\n",
 								    "        error = y_true - y_pred\n",
 								    "        is_small_error = tf.abs(error) < threshold\n",
 								    "        squared_loss = tf.square(error) / 2\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "        linear_loss  = threshold * tf.abs(error) - threshold ** 2 / 2\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        return tf.where(is_small_error, squared_loss, linear_loss)\n",
 								    "    return huber_fn"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 79,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "model.compile(loss=create_huber(2.0), optimizer=\"nadam\", metrics=[\"mae\"])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 80,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {
 								    "scrolled": true
 								   },
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.2051 - mae: 0.4598 - val_loss: 0.2249 - val_mae: 0.4582\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.1982 - mae: 0.4531 - val_loss: 0.2035 - val_mae: 0.4527\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19abec4f0>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 80,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 81,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss_threshold_2/assets\n"
 								     ]
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss_threshold_2/assets\n"
 								     ]
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.save(\"my_model_with_a_custom_loss_threshold_2\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 82,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model = tf.keras.models.load_model(\"my_model_with_a_custom_loss_threshold_2\",\n",
 								    "                                   custom_objects={\"huber_fn\": create_huber(2.0)})"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 83,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.1935 - mae: 0.4465 - val_loss: 0.2020 - val_mae: 0.4410\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.1899 - mae: 0.4422 - val_loss: 0.1867 - val_mae: 0.4399\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19ae75c30>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 83,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 84,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class HuberLoss(tf.keras.losses.Loss):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, threshold=1.0, **kwargs):\n",
 								    "        self.threshold = threshold\n",
 								    "        super().__init__(**kwargs)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def call(self, y_true, y_pred):\n",
 								    "        error = y_true - y_pred\n",
 								    "        is_small_error = tf.abs(error) < self.threshold\n",
 								    "        squared_loss = tf.square(error) / 2\n",
 								    "        linear_loss  = self.threshold * tf.abs(error) - self.threshold**2 / 2\n",
 								    "        return tf.where(is_small_error, squared_loss, linear_loss)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def get_config(self):\n",
 								    "        base_config = super().get_config()\n",
 								    "        return {**base_config, \"threshold\": self.threshold}"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 85,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – creates another basic Keras model\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
 								    "                          input_shape=input_shape),\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "    tf.keras.layers.Dense(1),\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 86,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "model.compile(loss=HuberLoss(2.), optimizer=\"nadam\", metrics=[\"mae\"])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 87,
-												Update notebooks to latest nbformat

											
										
										
											2020-04-06 09:13:12 +02:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.6492 - mae: 0.8468 - val_loss: 0.5093 - val_mae: 0.6723\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.2912 - mae: 0.5552 - val_loss: 0.3715 - val_mae: 0.5683\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19b1356c0>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 87,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 88,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss_class/assets\n"
 								     ]
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_loss_class/assets\n"
 								     ]
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.save(\"my_model_with_a_custom_loss_class\")  # extra code – saving works"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 89,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model = tf.keras.models.load_model(\"my_model_with_a_custom_loss_class\",\n",
 								    "                                   custom_objects={\"HuberLoss\": HuberLoss})"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 90,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.2416 - mae: 0.5034 - val_loss: 0.2922 - val_mae: 0.5057\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.2173 - mae: 0.4774 - val_loss: 0.2503 - val_mae: 0.4843\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19a781c60>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 90,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows that loading worked fine, the model can be used normally\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 91,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "2.0"
 								      ]
 								     },
 								     "execution_count": 91,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.loss.threshold  # extra code – the threshold was loaded correctly"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "## Other Custom Functions"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 92,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "def my_softplus(z):\n",
 								    "    return tf.math.log(1.0 + tf.exp(z))\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
 								    "def my_glorot_initializer(shape, dtype=tf.float32):\n",
 								    "    stddev = tf.sqrt(2. / (shape[0] + shape[1]))\n",
 								    "    return tf.random.normal(shape, stddev=stddev, dtype=dtype)\n",
 								    "\n",
 								    "def my_l1_regularizer(weights):\n",
 								    "    return tf.reduce_sum(tf.abs(0.01 * weights))\n",
 								    "\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "def my_positive_weights(weights):  # return value is just tf.nn.relu(weights)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    return tf.where(weights < 0., tf.zeros_like(weights), weights)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 93,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "layer = tf.keras.layers.Dense(1, activation=my_softplus,\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "                              kernel_initializer=my_glorot_initializer,\n",
 								    "                              kernel_regularizer=my_l1_regularizer,\n",
 								    "                              kernel_constraint=my_positive_weights)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 94,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 1.4714 - mae: 0.8316 - val_loss: inf - val_mae: inf\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.8094 - mae: 0.6172 - val_loss: 2.6153 - val_mae: 0.6058\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "INFO:tensorflow:Assets written to: my_model_with_many_custom_parts/assets\n"
 								     ]
 								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_many_custom_parts/assets\n"
 								     ]
 								    },
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.6333 - mae: 0.5617 - val_loss: 1.1687 - val_mae: 0.5468\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.5570 - mae: 0.5303 - val_loss: 1.0440 - val_mae: 0.5250\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19b868640>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 94,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – show that building, training, saving, loading, and training again\n",
 								    "#              works fine with a model containing many custom parts\n",
 								    "\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
 								    "                          input_shape=input_shape),\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "    tf.keras.layers.Dense(1, activation=my_softplus,\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "                          kernel_initializer=my_glorot_initializer,\n",
 								    "                          kernel_regularizer=my_l1_regularizer,\n",
 								    "                          kernel_constraint=my_positive_weights)\n",
 								    "])\n",
 								    "model.compile(loss=\"mse\", optimizer=\"nadam\", metrics=[\"mae\"])\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "          validation_data=(X_valid_scaled, y_valid))\n",
 								    "model.save(\"my_model_with_many_custom_parts\")\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.models.load_model(\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    \"my_model_with_many_custom_parts\",\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    custom_objects={\n",
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								    "       \"my_l1_regularizer\": my_l1_regularizer,\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "       \"my_positive_weights\": my_positive_weights,\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "       \"my_glorot_initializer\": my_glorot_initializer,\n",
 								    "       \"my_softplus\": my_softplus,\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    }\n",
 								    ")\n",
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 95,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class MyL1Regularizer(tf.keras.regularizers.Regularizer):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, factor):\n",
 								    "        self.factor = factor\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __call__(self, weights):\n",
 								    "        return tf.reduce_sum(tf.abs(self.factor * weights))\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def get_config(self):\n",
 								    "        return {\"factor\": self.factor}"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 96,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 1.4714 - mae: 0.8316 - val_loss: inf - val_mae: inf\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 998us/step - loss: 0.8094 - mae: 0.6172 - val_loss: 2.6153 - val_mae: 0.6058\n",
 								      "INFO:tensorflow:Assets written to: my_model_with_many_custom_parts/assets\n"
 								     ]
 								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_many_custom_parts/assets\n"
 								     ]
 								    },
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.6333 - mae: 0.5617 - val_loss: 1.1687 - val_mae: 0.5468\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.5570 - mae: 0.5303 - val_loss: 1.0440 - val_mae: 0.5250\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19b8db610>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 96,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – again, show that everything works fine, this time using our\n",
 								    "#              custom regularizer class\n",
 								    "\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
 								    "                          input_shape=input_shape),\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "    tf.keras.layers.Dense(1, activation=my_softplus,\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "                          kernel_regularizer=MyL1Regularizer(0.01),\n",
 								    "                          kernel_constraint=my_positive_weights,\n",
 								    "                          kernel_initializer=my_glorot_initializer),\n",
 								    "])\n",
 								    "model.compile(loss=\"mse\", optimizer=\"nadam\", metrics=[\"mae\"])\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "          validation_data=(X_valid_scaled, y_valid))\n",
 								    "model.save(\"my_model_with_many_custom_parts\")\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.models.load_model(\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    \"my_model_with_many_custom_parts\",\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    custom_objects={\n",
 								    "       \"MyL1Regularizer\": MyL1Regularizer,\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "       \"my_positive_weights\": my_positive_weights,\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "       \"my_glorot_initializer\": my_glorot_initializer,\n",
 								    "       \"my_softplus\": my_softplus,\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    }\n",
 								    ")\n",
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "## Custom Metrics"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 97,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – once again, let's create a basic Keras model\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
 								    "                          input_shape=input_shape),\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "    tf.keras.layers.Dense(1),\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 98,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "model.compile(loss=\"mse\", optimizer=\"nadam\", metrics=[create_huber(2.0)])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 99,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 844us/step - loss: 1.7474 - huber_fn: 0.6846\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 796us/step - loss: 0.7843 - huber_fn: 0.3136\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19b4fcf10>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 99,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – train the model with our custom metric\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model.fit(X_train_scaled, y_train, epochs=2)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "**Note**: if you use the same function as the loss and a metric, you may be surprised to see slightly different results. This is in part because the operations are not computed in exactly the same order, so there might be tiny floating-point errors. More importantly, if you use sample weights or class weights, then the equations are a bit different:\n",
 								    "* the `fit()` method keeps track of the mean of all batch losses seen so far since the start of the epoch. Each batch loss is the sum of the weighted instance losses divided by the _batch size_ (not the sum of weights, so the batch loss is _not_ the weighted mean of the losses).\n",
 								    "* the metric since the start of the epoch is equal to the sum of weighted instance losses divided by the sum of all weights seen so far. In other words, it is the weighted mean of all the instance losses. Not the same thing."
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### Streaming metrics"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 100,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=0.8>"
 								      ]
 								     },
 								     "execution_count": 100,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "precision = tf.keras.metrics.Precision()\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "precision([0, 1, 1, 1, 0, 1, 0, 1], [1, 1, 0, 1, 0, 1, 0, 1])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 101,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=0.5>"
 								      ]
 								     },
 								     "execution_count": 101,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "precision([0, 1, 0, 0, 1, 0, 1, 1], [1, 0, 1, 1, 0, 0, 0, 0])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 102,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=0.5>"
 								      ]
 								     },
 								     "execution_count": 102,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "precision.result()"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 103,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Variable 'true_positives:0' shape=(1,) dtype=float32, numpy=array([4.], dtype=float32)>,\n",
 								       " <tf.Variable 'false_positives:0' shape=(1,) dtype=float32, numpy=array([4.], dtype=float32)>]"
 								      ]
 								     },
 								     "execution_count": 103,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "precision.variables"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 104,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "precision.reset_states()"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Creating a streaming metric:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 105,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class HuberMetric(tf.keras.metrics.Metric):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, threshold=1.0, **kwargs):\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "        super().__init__(**kwargs)  # handles base args (e.g., dtype)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        self.threshold = threshold\n",
-												Update libraries to latest version, including TensorFlow 2.4.1 and Scikit-Learn 0.24.1

											
										
										
											2021-02-14 03:02:09 +01:00
+								    "        self.huber_fn = create_huber(threshold)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        self.total = self.add_weight(\"total\", initializer=\"zeros\")\n",
 								    "        self.count = self.add_weight(\"count\", initializer=\"zeros\")\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def update_state(self, y_true, y_pred, sample_weight=None):\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "        sample_metrics = self.huber_fn(y_true, y_pred)\n",
 								    "        self.total.assign_add(tf.reduce_sum(sample_metrics))\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        self.count.assign_add(tf.cast(tf.size(y_true), tf.float32))\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def result(self):\n",
 								    "        return self.total / self.count\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def get_config(self):\n",
 								    "        base_config = super().get_config()\n",
 								    "        return {**base_config, \"threshold\": self.threshold}"
 								   ]
 								  },
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "**Extra material** – the rest of this section tests the `HuberMetric` class and shows another implementation subclassing `tf.keras.metrics.Mean`."
 								   ]
 								  },
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 106,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=14.0>"
 								      ]
 								     },
 								     "execution_count": 106,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "m = HuberMetric(2.)\n",
 								    "\n",
 								    "# total = 2 * |10 - 2| - 2²/2 = 14\n",
 								    "# count = 1\n",
 								    "# result = 14 / 1 = 14\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "m(tf.constant([[2.]]), tf.constant([[10.]]))"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 107,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=7.0>"
 								      ]
 								     },
 								     "execution_count": 107,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "# total = total + (|1 - 0|² / 2) + (2 * |9.25 - 5| - 2² / 2) = 14 + 7 = 21\n",
 								    "# count = count + 2 = 3\n",
 								    "# result = total / count = 21 / 3 = 7\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "m(tf.constant([[0.], [5.]]), tf.constant([[1.], [9.25]]))"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 108,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=7.0>"
 								      ]
 								     },
 								     "execution_count": 108,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "m.result()"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 109,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Variable 'total:0' shape=() dtype=float32, numpy=21.0>,\n",
 								       " <tf.Variable 'count:0' shape=() dtype=float32, numpy=3.0>]"
 								      ]
 								     },
 								     "execution_count": 109,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "m.variables"
 								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "code",
 								   "execution_count": 110,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Variable 'total:0' shape=() dtype=float32, numpy=0.0>,\n",
 								       " <tf.Variable 'count:0' shape=() dtype=float32, numpy=0.0>]"
 								      ]
 								     },
 								     "execution_count": 110,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "m.reset_state()\n",
 								    "m.variables"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "Let's check that the `HuberMetric` class works well:"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 111,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
 								    "                          input_shape=input_shape),\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "    tf.keras.layers.Dense(1),\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 112,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.compile(loss=create_huber(2.0), optimizer=\"nadam\",\n",
 								    "              metrics=[HuberMetric(2.0)])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 113,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 886us/step - loss: 0.6492 - huber_metric_1: 0.6492\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 838us/step - loss: 0.2912 - huber_metric_1: 0.2912\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19c2d1300>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 113,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.fit(X_train_scaled, y_train, epochs=2)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 114,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_metric/assets\n"
 								     ]
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_metric/assets\n"
 								     ]
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.save(\"my_model_with_a_custom_metric\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 115,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model = tf.keras.models.load_model(\n",
 								    "    \"my_model_with_a_custom_metric\",\n",
 								    "    custom_objects={\n",
 								    "        \"huber_fn\": create_huber(2.0),\n",
 								    "        \"HuberMetric\": HuberMetric\n",
 								    "    }\n",
 								    ")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 116,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 916us/step - loss: 0.2416 - huber_metric_1: 0.2416\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 859us/step - loss: 0.2173 - huber_metric_1: 0.2173\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19b5f0130>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 116,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.fit(X_train_scaled, y_train, epochs=2)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
-												Fix some issues with TF 2.2 breaking changes

											
										
										
											2020-04-02 01:52:31 +02:00
+								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "`model.metrics` contains the model's loss followed by the model's metric(s), so the `HuberMetric` is `model.metrics[-1]`:"
-												Fix some issues with TF 2.2 breaking changes

											
										
										
											2020-04-02 01:52:31 +02:00
+								   ]
 								  },
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 117,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "2.0"
 								      ]
 								     },
 								     "execution_count": 117,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Fix some issues with TF 2.2 breaking changes

											
										
										
											2020-04-02 01:52:31 +02:00
+								    "model.metrics[-1].threshold"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Looks like it works fine! More simply, we could have created the class like this:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 118,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class HuberMetric(tf.keras.metrics.Mean):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, threshold=1.0, name='HuberMetric', dtype=None):\n",
 								    "        self.threshold = threshold\n",
 								    "        self.huber_fn = create_huber(threshold)\n",
 								    "        super().__init__(name=name, dtype=dtype)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def update_state(self, y_true, y_pred, sample_weight=None):\n",
 								    "        metric = self.huber_fn(y_true, y_pred)\n",
 								    "        super(HuberMetric, self).update_state(metric, sample_weight)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def get_config(self):\n",
 								    "        base_config = super().get_config()\n",
 								    "        return {**base_config, \"threshold\": self.threshold}"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "This class handles shapes better, and it also supports sample weights."
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 119,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
 								    "                          input_shape=input_shape),\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "    tf.keras.layers.Dense(1),\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 120,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.compile(loss=tf.keras.losses.Huber(2.0), optimizer=\"nadam\",\n",
 								    "              weighted_metrics=[HuberMetric(2.0)])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 121,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {
 								    "scrolled": true
 								   },
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 898us/step - loss: 0.3272 - HuberMetric: 0.6594\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 892us/step - loss: 0.1449 - HuberMetric: 0.2919\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "np.random.seed(42)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "sample_weight = np.random.rand(len(y_train))\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "history = model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "                    sample_weight=sample_weight)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 122,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "(0.3272010087966919, 0.3272010869771911)"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 122,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "(history.history[\"loss\"][0],\n",
 								    " history.history[\"HuberMetric\"][0] * sample_weight.mean())"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 123,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_metric_v2/assets\n"
 								     ]
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_metric_v2/assets\n"
 								     ]
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.save(\"my_model_with_a_custom_metric_v2\")"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 124,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model = tf.keras.models.load_model(\"my_model_with_a_custom_metric_v2\",\n",
 								    "                                   custom_objects={\"HuberMetric\": HuberMetric})"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 125,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 970us/step - loss: 0.2442 - HuberMetric: 0.2442\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 857us/step - loss: 0.2184 - HuberMetric: 0.2184\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19c576e90>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 125,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.fit(X_train_scaled, y_train, epochs=2)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 126,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {
 								    "scrolled": true
 								   },
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "2.0"
 								      ]
 								     },
 								     "execution_count": 126,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Fix some issues with TF 2.2 breaking changes

											
										
										
											2020-04-02 01:52:31 +02:00
+								    "model.metrics[-1].threshold"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "## Custom Layers"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 127,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "exponential_layer = tf.keras.layers.Lambda(lambda x: tf.exp(x))"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 128,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(3,), dtype=float32, numpy=array([0.36787945, 1.        , 2.7182817 ], dtype=float32)>"
 								      ]
 								     },
 								     "execution_count": 128,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – like all layers, it can be used as a function:\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "exponential_layer([-1., 0., 1.])"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "Adding an exponential layer at the output of a regression model can be useful if the values to predict are positive and span very different scales (e.g., 0.001, 10., 10000)."
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 129,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.7784 - val_loss: 0.4393\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 891us/step - loss: 0.5702 - val_loss: 0.4094\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 3/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.4431 - val_loss: 0.3760\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 4/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 921us/step - loss: 0.4984 - val_loss: 0.3785\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 5/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 943us/step - loss: 0.3966 - val_loss: 0.3633\n",
 								      "162/162 [==============================] - 0s 631us/step - loss: 0.3781\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "0.3781099021434784"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 129,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
 								    "    tf.keras.layers.Dense(30, activation=\"relu\", input_shape=input_shape),\n",
 								    "    tf.keras.layers.Dense(1),\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    exponential_layer\n",
 								    "])\n",
-												Update libraries to latest version, including TensorFlow 2.4.1 and Scikit-Learn 0.24.1

											
										
										
											2021-02-14 03:02:09 +01:00
+								    "model.compile(loss=\"mse\", optimizer=\"sgd\")\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model.fit(X_train_scaled, y_train, epochs=5,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))\n",
 								    "model.evaluate(X_test_scaled, y_test)"
 								   ]
 								  },
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
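+								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Alternatively, it's often preferable to replace the targets with the logarithm of the targets (and use no activation function in the output layer). In that case the model predicts log-values, so apply the exponential function to its predictions to recover values on the original scale."
 								   ]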
 								  },
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 130,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class MyDense(tf.keras.layers.Layer):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, units, activation=None, **kwargs):\n",
 								    "        super().__init__(**kwargs)\n",
 								    "        self.units = units\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "        self.activation = tf.keras.activations.get(activation)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
 								    "    def build(self, batch_input_shape):\n",
 								    "        self.kernel = self.add_weight(\n",
 								    "            name=\"kernel\", shape=[batch_input_shape[-1], self.units],\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "            initializer=\"he_normal\")\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        self.bias = self.add_weight(\n",
 								    "            name=\"bias\", shape=[self.units], initializer=\"zeros\")\n",
 								    "\n",
 								    "    def call(self, X):\n",
 								    "        return self.activation(X @ self.kernel + self.bias)\n",
 								    "\n",
 								    "    def get_config(self):\n",
 								    "        base_config = super().get_config()\n",
 								    "        return {**base_config, \"units\": self.units,\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "                \"activation\": tf.keras.activations.serialize(self.activation)}"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 131,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 3.1183 - val_loss: 6.9549\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.8702 - val_loss: 3.2627\n",
 								      "162/162 [==============================] - 0s 718us/step - loss: 0.7039\n",
 								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_layer/assets\n"
 								     ]
 								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "INFO:tensorflow:Assets written to: my_model_with_a_custom_layer/assets\n"
 								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows that a custom layer can be used normally\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    MyDense(30, activation=\"relu\", input_shape=input_shape),\n",
 								    "    MyDense(1)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "])\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model.compile(loss=\"mse\", optimizer=\"nadam\")\n",
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.evaluate(X_test_scaled, y_test)\n",
 								    "model.save(\"my_model_with_a_custom_layer\")"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 132,
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 0.5945 - val_loss: 0.5318\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.4712 - val_loss: 0.5751\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19cbf39a0>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 132,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows how to load a model with a custom layer\n",
 								    "model = tf.keras.models.load_model(\"my_model_with_a_custom_layer\",\n",
 								    "                                   custom_objects={\"MyDense\": MyDense})\n",
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 133,
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "class MyMultiLayer(tf.keras.layers.Layer):\n",
 								    "    def call(self, X):\n",
 								    "        X1, X2 = X\n",
 								    "        print(\"X1.shape: \", X1.shape ,\" X2.shape: \", X2.shape)  # extra code\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "        return X1 + X2, X1 * X2, X1 / X2"
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   ]
 								  },
-												Add explanations for the models using the custom layers

											
										
										
											2021-07-01 03:19:38 +02:00
+								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "Our custom layer can be called using the functional API like this:"
-												Add explanations for the models using the custom layers

											
										
										
											2021-07-01 03:19:38 +02:00
+								   ]
 								  },
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 134,
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "X1.shape:  (None, 2)  X2.shape:  (None, 2)\n"
 								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "(<KerasTensor: shape=(None, 2) dtype=float32 (created by layer 'my_multi_layer')>,\n",
 								       " <KerasTensor: shape=(None, 2) dtype=float32 (created by layer 'my_multi_layer')>,\n",
 								       " <KerasTensor: shape=(None, 2) dtype=float32 (created by layer 'my_multi_layer')>)"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 134,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – tests MyMultiLayer with symbolic inputs\n",
 								    "inputs1 = tf.keras.layers.Input(shape=[2])\n",
 								    "inputs2 = tf.keras.layers.Input(shape=[2])\n",
 								    "MyMultiLayer()((inputs1, inputs2))"
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "Note that the `call()` method receives symbolic inputs, and it returns symbolic outputs. The shapes are only partially specified at this stage: we don't know the batch size, which is why the first dimension is `None`.\n",
 								    "\n",
 								    "We can also pass actual data to the custom layer:"
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 135,
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "X1.shape:  (2, 2)  X2.shape:  (2, 2)\n"
 								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
 								       "(<tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
 								       " array([[ 9., 18.],\n",
 								       "        [ 6., 10.]], dtype=float32)>,\n",
 								       " <tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
 								       " array([[18., 72.],\n",
 								       "        [ 8., 21.]], dtype=float32)>,\n",
 								       " <tf.Tensor: shape=(2, 2), dtype=float32, numpy=\n",
 								       " array([[0.5      , 0.5      ],\n",
 								       "        [0.5      , 2.3333333]], dtype=float32)>)"
 								      ]
 								     },
 								     "execution_count": 135,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – tests MyMultiLayer with actual data\n",
 								    "X1, X2 = np.array([[3., 6.], [2., 7.]]), np.array([[6., 12.], [4., 3.]]) \n",
 								    "MyMultiLayer()((X1, X2))"
-												Chapter 12 Multi Layer Example

											
										
										
											2021-06-24 04:03:01 +02:00
+								   ]
 								  },
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Add explanations for the models using the custom layers

											
										
										
											2021-07-01 03:19:38 +02:00
+								    "Now let's create a layer with a different behavior during training and testing:"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 136,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "class MyGaussianNoise(tf.keras.layers.Layer):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, stddev, **kwargs):\n",
 								    "        super().__init__(**kwargs)\n",
 								    "        self.stddev = stddev\n",
 								    "\n",
 								    "    def call(self, X, training=None):\n",
 								    "        if training:\n",
 								    "            noise = tf.random.normal(tf.shape(X), stddev=self.stddev)\n",
 								    "            return X + noise\n",
 								    "        else:\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "            return X"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Add explanations for the models using the custom layers

											
										
										
											2021-07-01 03:19:38 +02:00
+								   "cell_type": "markdown",
-												Adding example Gaussian Noise model

											
										
										
											2021-06-24 04:14:34 +02:00
+								   "metadata": {},
 								   "source": [
-												Add explanations for the models using the custom layers

											
										
										
											2021-07-01 03:19:38 +02:00
+								    "Here's a simple model that uses this custom layer:"
-												Adding example Gaussian Noise model

											
										
										
											2021-06-24 04:14:34 +02:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 137,
-												Adding example Gaussian Noise model

											
										
										
											2021-06-24 04:14:34 +02:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 2.2220 - val_loss: 25.1506\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 1.4104 - val_loss: 17.0415\n",
 								      "162/162 [==============================] - 0s 655us/step - loss: 1.1059\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "1.1058681011199951"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 137,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Adding example Gaussian Noise model

											
										
										
											2021-06-24 04:14:34 +02:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – tests MyGaussianNoise\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    MyGaussianNoise(stddev=1.0, input_shape=input_shape),\n",
 								    "    tf.keras.layers.Dense(30, activation=\"relu\",\n",
 								    "                          kernel_initializer=\"he_normal\"),\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "    tf.keras.layers.Dense(1)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "])\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model.compile(loss=\"mse\", optimizer=\"nadam\")\n",
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))\n",
 								    "model.evaluate(X_test_scaled, y_test)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "## Custom Models"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 138,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class ResidualBlock(tf.keras.layers.Layer):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, n_layers, n_neurons, **kwargs):\n",
 								    "        super().__init__(**kwargs)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "        self.hidden = [tf.keras.layers.Dense(n_neurons, activation=\"relu\",\n",
 								    "                                             kernel_initializer=\"he_normal\")\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "                       for _ in range(n_layers)]\n",
 								    "\n",
 								    "    def call(self, inputs):\n",
 								    "        Z = inputs\n",
 								    "        for layer in self.hidden:\n",
 								    "            Z = layer(Z)\n",
-												Fix some issues with TF 2.2 breaking changes

											
										
										
											2020-04-02 01:52:31 +02:00
+								    "        return inputs + Z"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 139,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class ResidualRegressor(tf.keras.Model):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, output_dim, **kwargs):\n",
 								    "        super().__init__(**kwargs)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "        self.hidden1 = tf.keras.layers.Dense(30, activation=\"relu\",\n",
 								    "                                             kernel_initializer=\"he_normal\")\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        self.block1 = ResidualBlock(2, 30)\n",
 								    "        self.block2 = ResidualBlock(2, 30)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "        self.out = tf.keras.layers.Dense(output_dim)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
 								    "    def call(self, inputs):\n",
 								    "        Z = self.hidden1(inputs)\n",
 								    "        for _ in range(1 + 3):\n",
 								    "            Z = self.block1(Z)\n",
 								    "        Z = self.block2(Z)\n",
-												Fix some issues with TF 2.2 breaking changes

											
										
										
											2020-04-02 01:52:31 +02:00
+								    "        return self.out(Z)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 140,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 2s 1ms/step - loss: 32.7847\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 1.3612\n",
 								      "162/162 [==============================] - 0s 713us/step - loss: 1.1603\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "INFO:tensorflow:Assets written to: my_custom_model/assets\n"
 								     ]
 								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
 								      "INFO:tensorflow:Assets written to: my_custom_model/assets\n"
 								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows that the model can be used normally\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model = ResidualRegressor(1)\n",
 								    "model.compile(loss=\"mse\", optimizer=\"nadam\")\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "history = model.fit(X_train_scaled, y_train, epochs=2)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "score = model.evaluate(X_test_scaled, y_test)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "model.save(\"my_custom_model\")"
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 141,
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 2s 1ms/step - loss: 1.3451\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.7928\n",
 								      "1/1 [==============================] - 0s 76ms/step\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "array([[1.1431919],\n",
 								       "       [1.0584592],\n",
 								       "       [4.71127  ]], dtype=float32)"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 141,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – the model can be loaded and you can continue training or use it\n",
 								    "#              to make predictions\n",
 								    "model = tf.keras.models.load_model(\"my_custom_model\")\n",
 								    "history = model.fit(X_train_scaled, y_train, epochs=2)\n",
 								    "model.predict(X_test_scaled[:3])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "We could have defined the model using the sequential API instead:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 142,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "block1 = ResidualBlock(2, 30)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    tf.keras.layers.Dense(30, activation=\"relu\",\n",
 								    "                          kernel_initializer=\"he_normal\"),\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    block1, block1, block1, block1,\n",
 								    "    ResidualBlock(2, 30),\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "    tf.keras.layers.Dense(1)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "])"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "## Losses and Metrics Based on Model Internals"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 143,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class ReconstructingRegressor(tf.keras.Model):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, output_dim, **kwargs):\n",
 								    "        super().__init__(**kwargs)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "        self.hidden = [tf.keras.layers.Dense(30, activation=\"relu\",\n",
 								    "                                             kernel_initializer=\"he_normal\")\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "                       for _ in range(5)]\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "        self.out = tf.keras.layers.Dense(output_dim)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "        self.reconstruction_mean = tf.keras.metrics.Mean(\n",
 								    "            name=\"reconstruction_error\")\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
-												TF mostly fixed an issue so remove workaround for ReconstructingRegressor

											
										
										
											2021-10-07 08:08:15 +02:00
+								    "    def build(self, batch_input_shape):\n",
 								    "        n_inputs = batch_input_shape[-1]\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "        self.reconstruct = tf.keras.layers.Dense(n_inputs)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								    "    def call(self, inputs, training=None):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        Z = inputs\n",
 								    "        for layer in self.hidden:\n",
 								    "            Z = layer(Z)\n",
 								    "        reconstruction = self.reconstruct(Z)\n",
 								    "        recon_loss = tf.reduce_mean(tf.square(reconstruction - inputs))\n",
 								    "        self.add_loss(0.05 * recon_loss)\n",
-												Update libraries to latest version, including TensorFlow 2.4.1 and Scikit-Learn 0.24.1

											
										
										
											2021-02-14 03:02:09 +01:00
+								    "        if training:\n",
 								    "            result = self.reconstruction_mean(recon_loss)\n",
 								    "            self.add_metric(result)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        return self.out(Z)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 144,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 2s 1ms/step - loss: 0.8198 - reconstruction_error: 1.0892\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.4778 - reconstruction_error: 0.5583\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 3/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.4419 - reconstruction_error: 0.4227\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 4/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.3852 - reconstruction_error: 0.3587\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 5/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.3714 - reconstruction_error: 0.3245\n",
 								      "162/162 [==============================] - 0s 658us/step\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – trains the ReconstructingRegressor and uses it to make predictions\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model = ReconstructingRegressor(1)\n",
 								    "model.compile(loss=\"mse\", optimizer=\"nadam\")\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "history = model.fit(X_train_scaled, y_train, epochs=5)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "y_pred = model.predict(X_test_scaled)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "## Computing Gradients Using Autodiff"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 145,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "def f(w1, w2):\n",
 								    "    return 3 * w1 ** 2 + 2 * w1 * w2"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 146,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "36.000003007075065"
 								      ]
 								     },
 								     "execution_count": 146,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "w1, w2 = 5, 3\n",
 								    "eps = 1e-6\n",
 								    "(f(w1 + eps, w2) - f(w1, w2)) / eps"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 147,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "10.000000003174137"
 								      ]
 								     },
 								     "execution_count": 147,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "(f(w1, w2 + eps) - f(w1, w2)) / eps"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 148,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "w1, w2 = tf.Variable(5.), tf.Variable(3.)\n",
 								    "with tf.GradientTape() as tape:\n",
 								    "    z = f(w1, w2)\n",
 								    "\n",
 								    "gradients = tape.gradient(z, [w1, w2])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 149,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor: shape=(), dtype=float32, numpy=36.0>,\n",
 								       " <tf.Tensor: shape=(), dtype=float32, numpy=10.0>]"
 								      ]
 								     },
 								     "execution_count": 149,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "gradients"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 150,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "A non-persistent GradientTape can only be used to compute one set of gradients (or jacobians)\n"
 								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "with tf.GradientTape() as tape:\n",
 								    "    z = f(w1, w2)\n",
 								    "\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "dz_dw1 = tape.gradient(z, w1)  # returns tensor 36.0\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "try:\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    dz_dw2 = tape.gradient(z, w2)  # raises a RuntimeError!\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "except RuntimeError as ex:\n",
 								    "    print(ex)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 151,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "with tf.GradientTape(persistent=True) as tape:\n",
 								    "    z = f(w1, w2)\n",
 								    "\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "dz_dw1 = tape.gradient(z, w1)  # returns tensor 36.0\n",
 								    "dz_dw2 = tape.gradient(z, w2)  # returns tensor 10.0, works fine now!\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "del tape"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 152,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "(<tf.Tensor: shape=(), dtype=float32, numpy=36.0>,\n",
 								       " <tf.Tensor: shape=(), dtype=float32, numpy=10.0>)"
 								      ]
 								     },
 								     "execution_count": 152,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "dz_dw1, dz_dw2"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 153,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "c1, c2 = tf.constant(5.), tf.constant(3.)\n",
 								    "with tf.GradientTape() as tape:\n",
 								    "    z = f(c1, c2)\n",
 								    "\n",
 								    "gradients = tape.gradient(z, [c1, c2])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 154,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[None, None]"
 								      ]
 								     },
 								     "execution_count": 154,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "gradients"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 155,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "with tf.GradientTape() as tape:\n",
 								    "    tape.watch(c1)\n",
 								    "    tape.watch(c2)\n",
 								    "    z = f(c1, c2)\n",
 								    "\n",
 								    "gradients = tape.gradient(z, [c1, c2])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 156,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor: shape=(), dtype=float32, numpy=36.0>,\n",
 								       " <tf.Tensor: shape=(), dtype=float32, numpy=10.0>]"
 								      ]
 								     },
 								     "execution_count": 156,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "gradients"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 157,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor: shape=(), dtype=float32, numpy=136.0>,\n",
 								       " <tf.Tensor: shape=(), dtype=float32, numpy=30.0>]"
 								      ]
 								     },
 								     "execution_count": 157,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – if given a vector, tape.gradient() will compute the gradient of\n",
 								    "#              the vector's sum.\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "with tf.GradientTape() as tape:\n",
 								    "    z1 = f(w1, w2 + 2.)\n",
 								    "    z2 = f(w1, w2 + 5.)\n",
 								    "    z3 = f(w1, w2 + 7.)\n",
 								    "\n",
 								    "tape.gradient([z1, z2, z3], [w1, w2])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 158,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor: shape=(), dtype=float32, numpy=136.0>,\n",
 								       " <tf.Tensor: shape=(), dtype=float32, numpy=30.0>]"
 								      ]
 								     },
 								     "execution_count": 158,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows that we get the same result as the previous cell\n",
 								    "with tf.GradientTape() as tape:\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    z1 = f(w1, w2 + 2.)\n",
 								    "    z2 = f(w1, w2 + 5.)\n",
 								    "    z3 = f(w1, w2 + 7.)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    z = z1 + z2 + z3\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tape.gradient(z, [w1, w2])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 159,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows how to compute the jacobians and the hessians\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "with tf.GradientTape(persistent=True) as hessian_tape:\n",
 								    "    with tf.GradientTape() as jacobian_tape:\n",
 								    "        z = f(w1, w2)\n",
 								    "    jacobians = jacobian_tape.gradient(z, [w1, w2])\n",
 								    "hessians = [hessian_tape.gradient(jacobian, [w1, w2])\n",
 								    "            for jacobian in jacobians]\n",
 								    "del hessian_tape"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 160,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor: shape=(), dtype=float32, numpy=36.0>,\n",
 								       " <tf.Tensor: shape=(), dtype=float32, numpy=10.0>]"
 								      ]
 								     },
 								     "execution_count": 160,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "jacobians"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 161,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[[<tf.Tensor: shape=(), dtype=float32, numpy=6.0>,\n",
 								       "  <tf.Tensor: shape=(), dtype=float32, numpy=2.0>],\n",
 								       " [<tf.Tensor: shape=(), dtype=float32, numpy=2.0>, None]]"
 								      ]
 								     },
 								     "execution_count": 161,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "hessians"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 162,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "def f(w1, w2):\n",
 								    "    return 3 * w1 ** 2 + tf.stop_gradient(2 * w1 * w2)\n",
 								    "\n",
 								    "with tf.GradientTape() as tape:\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    z = f(w1, w2)  # same result as without stop_gradient()\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "gradients = tape.gradient(z, [w1, w2])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 163,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor: shape=(), dtype=float32, numpy=30.0>, None]"
 								      ]
 								     },
 								     "execution_count": 163,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "gradients"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 164,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor: shape=(), dtype=float32, numpy=inf>]"
 								      ]
 								     },
 								     "execution_count": 164,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "x = tf.Variable(1e-50)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "with tf.GradientTape() as tape:\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    z = tf.sqrt(x)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
 								    "tape.gradient(z, [x])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 165,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=30.0>"
 								      ]
 								     },
 								     "execution_count": 165,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tf.math.log(tf.exp(tf.constant(30., dtype=tf.float32)) + 1.)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 166,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "[<tf.Tensor: shape=(1,), dtype=float32, numpy=array([nan], dtype=float32)>]"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 166,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "x = tf.Variable([1.0e30])\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "with tf.GradientTape() as tape:\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    z = my_softplus(x)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "tape.gradient(z, [x])"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 167,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "def my_softplus(z):\n",
 								    "    return tf.math.log(1 + tf.exp(-tf.abs(z))) + tf.maximum(0., z)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "Here is the proof that this equation is equal to log(1 + exp(_z_)):\n",
 								    "* softplus(_z_) = log(1 + exp(_z_))\n",
 								    "* softplus(_z_) = log(1 + exp(_z_)) - log(exp(_z_)) + log(exp(_z_)) ; **just adding and subtracting the same value**\n",
 								    "* softplus(_z_) = log\\[(1 + exp(_z_)) / exp(_z_)\\] + log(exp(_z_)) ; **since log(_a_) - log(_b_) = log(_a_ / _b_)**\n",
 								    "* softplus(_z_) = log\\[(1 + exp(_z_)) / exp(_z_)\\] + _z_ ; **since log(exp(_z_)) = _z_**\n",
 								    "* softplus(_z_) = log\\[1 / exp(_z_) + exp(_z_) / exp(_z_)\\] + _z_ ; **since (1 + _a_) / _b_ = 1 / _b_ + _a_ / _b_**\n",
 								    "* softplus(_z_) = log\\[exp(–_z_) + 1\\] + _z_ ; **since 1 / exp(_z_) = exp(–z), and exp(_z_) / exp(_z_) = 1**\n",
 								    "* softplus(_z_) = softplus(–_z_) + _z_ ; **we recognize the definition at the top, but with –_z_**\n",
 								    "* softplus(_z_) = softplus(–|_z_|) + max(0, _z_) ; **if you consider both cases, _z_ < 0 or _z_ ≥ 0, you will see that this works**"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 168,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "@tf.custom_gradient\n",
 								    "def my_softplus(z):\n",
 								    "    def my_softplus_gradients(grads):  # grads = backprop'ed from upper layers\n",
 								    "        return grads * (1 - 1 / (1 + tf.exp(z)))  # stable grads of softplus\n",
 								    "\n",
 								    "    result = tf.math.log(1 + tf.exp(-tf.abs(z))) + tf.maximum(0., z)\n",
 								    "    return result, my_softplus_gradients"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 169,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "(<tf.Tensor: shape=(1,), dtype=float32, numpy=array([1000.], dtype=float32)>,\n",
 								       " [<tf.Tensor: shape=(1,), dtype=float32, numpy=array([1.], dtype=float32)>])"
 								      ]
 								     },
 								     "execution_count": 169,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows that the function is now stable, as well as its gradients\n",
 								    "x = tf.Variable([1000.])\n",
 								    "with tf.GradientTape() as tape:\n",
 								    "    z = my_softplus(x)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "z, tape.gradient(z, [x])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "cell_type": "markdown",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "## Custom Training Loops"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 170,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)  # extra code – to ensure reproducibility\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "l2_reg = tf.keras.regularizers.l2(0.05)\n",
 								    "model = tf.keras.models.Sequential([\n",
 								    "    tf.keras.layers.Dense(30, activation=\"relu\", kernel_initializer=\"he_normal\",\n",
 								    "                          kernel_regularizer=l2_reg),\n",
 								    "    tf.keras.layers.Dense(1, kernel_regularizer=l2_reg)\n",
 								    "])"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 171,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "def random_batch(X, y, batch_size=32):\n",
 								    "    idx = np.random.randint(len(X), size=batch_size)\n",
 								    "    return X[idx], y[idx]"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 172,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "def print_status_bar(step, total, loss, metrics=None):\n",
 								    "    metrics = \" - \".join([f\"{m.name}: {m.result():.4f}\"\n",
 								    "                          for m in [loss] + (metrics or [])])\n",
 								    "    end = \"\" if step < total else \"\\n\"\n",
 								    "    print(f\"\\r{step}/{total} - \" + metrics, end=end)"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 173,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 174,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "n_epochs = 5\n",
 								    "batch_size = 32\n",
 								    "n_steps = len(X_train) // batch_size\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "optimizer = tf.keras.optimizers.SGD(learning_rate=0.01)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "loss_fn = tf.keras.losses.mean_squared_error\n",
 								    "mean_loss = tf.keras.metrics.Mean()\n",
 								    "metrics = [tf.keras.metrics.MeanAbsoluteError()]"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 175,
-												Large change: replace os.path with pathlib, move to Python 3.7

											
										
										
											2021-10-15 10:46:27 +02:00
+								   "metadata": {
 								    "scrolled": true
 								   },
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "362/362 - mean: 3.5419 - mean_absolute_error: 0.6640\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "362/362 - mean: 1.8693 - mean_absolute_error: 0.5431\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 3/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "362/362 - mean: 1.1428 - mean_absolute_error: 0.5030\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 4/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "362/362 - mean: 0.8501 - mean_absolute_error: 0.4977\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 5/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "362/362 - mean: 0.7280 - mean_absolute_error: 0.5014\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "for epoch in range(1, n_epochs + 1):\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    print(f\"Epoch {epoch}/{n_epochs}\")\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    for step in range(1, n_steps + 1):\n",
 								    "        X_batch, y_batch = random_batch(X_train_scaled, y_train)\n",
 								    "        with tf.GradientTape() as tape:\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "            y_pred = model(X_batch, training=True)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "            main_loss = tf.reduce_mean(loss_fn(y_batch, y_pred))\n",
 								    "            loss = tf.add_n([main_loss] + model.losses)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        gradients = tape.gradient(loss, model.trainable_variables)\n",
 								    "        optimizer.apply_gradients(zip(gradients, model.trainable_variables))\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
 								    "        # extra code – if your model has variable constraints\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        for variable in model.variables:\n",
 								    "            if variable.constraint is not None:\n",
 								    "                variable.assign(variable.constraint(variable))\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        mean_loss(loss)\n",
 								    "        for metric in metrics:\n",
 								    "            metric(y_batch, y_pred)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "\n",
 								    "        print_status_bar(step, n_steps, mean_loss, metrics)\n",
 								    "\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    for metric in [mean_loss] + metrics:\n",
 								    "        metric.reset_states()"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 176,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "28534c4a7baf4b78a8a9f1db10024cfd",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "All epochs:   0%|          | 0/5 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "cd7c0a89c62f476db08f755e6e4f1178",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 1/5:   0%|          | 0/362 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "5866293693b1455584e6a2e28811692a",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 2/5:   0%|          | 0/362 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "84cf94014b644e07b649063016221d3f",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 3/5:   0%|          | 0/362 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "21e3803f4d4249049efc0b725c9bd23f",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 4/5:   0%|          | 0/362 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "c8c0aa7115374ed8891175bafc6f7d0d",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 5/5:   0%|          | 0/362 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows how to use the tqdm package to display nice progress bars\n",
 								    "\n",
 								    "from tqdm.notebook import trange\n",
 								    "from collections import OrderedDict\n",
 								    "with trange(1, n_epochs + 1, desc=\"All epochs\") as epochs:\n",
 								    "    for epoch in epochs:\n",
 								    "        with trange(1, n_steps + 1, desc=f\"Epoch {epoch}/{n_epochs}\") as steps:\n",
 								    "            for step in steps:\n",
 								    "                X_batch, y_batch = random_batch(X_train_scaled, y_train)\n",
 								    "                with tf.GradientTape() as tape:\n",
 								    "                    y_pred = model(X_batch)\n",
 								    "                    main_loss = tf.reduce_mean(loss_fn(y_batch, y_pred))\n",
 								    "                    loss = tf.add_n([main_loss] + model.losses)\n",
 								    "\n",
 								    "                gradients = tape.gradient(loss, model.trainable_variables)\n",
 								    "                optimizer.apply_gradients(zip(gradients, model.trainable_variables))\n",
 								    "\n",
 								    "                for variable in model.variables:\n",
 								    "                    if variable.constraint is not None:\n",
 								    "                        variable.assign(variable.constraint(variable))\n",
 								    "\n",
 								    "                status = OrderedDict()\n",
 								    "                mean_loss(loss)\n",
 								    "                status[\"loss\"] = mean_loss.result().numpy()\n",
 								    "                for metric in metrics:\n",
 								    "                    metric(y_batch, y_pred)\n",
 								    "                    status[metric.name] = metric.result().numpy()\n",
 								    "\n",
 								    "                steps.set_postfix(status)\n",
 								    "\n",
 								    "        for metric in [mean_loss] + metrics:\n",
 								    "            metric.reset_states()"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "## TensorFlow Functions"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 177,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "def cube(x):\n",
 								    "    \"\"\"Return x raised to the power of 3.\"\"\"\n",
 								    "    return x ** 3"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 178,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "8"
 								      ]
 								     },
 								     "execution_count": 178,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "cube(2)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 179,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=8.0>"
 								      ]
 								     },
 								     "execution_count": 179,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "cube(tf.constant(2.0))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 180,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<tensorflow.python.eager.polymorphic_function.polymorphic_function.Function at 0x19db349d0>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 180,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "tf_cube = tf.function(cube)\n",
 								    "tf_cube"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 181,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=8>"
 								      ]
 								     },
 								     "execution_count": 181,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "tf_cube(2)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 182,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=8.0>"
 								      ]
 								     },
 								     "execution_count": 182,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "tf_cube(tf.constant(2.0))"
 								   ]
 								  },
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								  {
 								   "cell_type": "code",
 								   "execution_count": 183,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "@tf.function\n",
 								    "def tf_cube(x):\n",
 								    "    \"\"\"Return x cubed; the @tf.function decorator wraps this in a TF Function.\"\"\"\n",
 								    "    return x ** 3"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "**Note:** the rest of the code in this section is in appendix D."
 								   ]
 								  },
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### TF Functions and Concrete Functions"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 184,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<ConcreteFunction tf_cube(x) at 0x19F90F400>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 184,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "concrete_function = tf_cube.get_concrete_function(tf.constant(2.0))\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "concrete_function"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 185,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=8.0>"
 								      ]
 								     },
 								     "execution_count": 185,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "concrete_function(tf.constant(2.0))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 186,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "True"
 								      ]
 								     },
 								     "execution_count": 186,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "concrete_function is tf_cube.get_concrete_function(tf.constant(2.0))"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### Exploring Function Definitions and Graphs"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 187,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "PyGraph<6956689888>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 187,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "concrete_function.graph"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 188,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Operation 'x' type=Placeholder>,\n",
 								       " <tf.Operation 'pow/y' type=Const>,\n",
 								       " <tf.Operation 'pow' type=Pow>,\n",
 								       " <tf.Operation 'Identity' type=Identity>]"
 								      ]
 								     },
 								     "execution_count": 188,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "ops = concrete_function.graph.get_operations()\n",
 								    "ops"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 189,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor 'x:0' shape=() dtype=float32>,\n",
 								       " <tf.Tensor 'pow/y:0' shape=() dtype=float32>]"
 								      ]
 								     },
 								     "execution_count": 189,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "pow_op = ops[2]\n",
 								    "list(pow_op.inputs)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 190,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Tensor 'pow:0' shape=() dtype=float32>]"
 								      ]
 								     },
 								     "execution_count": 190,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "pow_op.outputs"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 191,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Operation 'x' type=Placeholder>"
 								      ]
 								     },
 								     "execution_count": 191,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "concrete_function.graph.get_operation_by_name('x')"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 192,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor 'Identity:0' shape=() dtype=float32>"
 								      ]
 								     },
 								     "execution_count": 192,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "concrete_function.graph.get_tensor_by_name('Identity:0')"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 193,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "name: \"__inference_tf_cube_592407\"\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "input_arg {\n",
 								       "  name: \"x\"\n",
 								       "  type: DT_FLOAT\n",
 								       "}\n",
 								       "output_arg {\n",
 								       "  name: \"identity\"\n",
 								       "  type: DT_FLOAT\n",
 								       "}"
 								      ]
 								     },
 								     "execution_count": 193,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "concrete_function.function_def.signature"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### How TF Functions Trace Python Functions to Extract Their Computation Graphs"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 194,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "@tf.function\n",
 								    "def tf_cube(x):\n",
 								    "    \"\"\"Return x cubed; the print() call only runs while the function is traced.\"\"\"\n",
 								    "    print(f\"x = {x}\")\n",
 								    "    cubed = x ** 3\n",
 								    "    return cubed"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 195,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "x = Tensor(\"x:0\", shape=(), dtype=float32)\n"
 								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "result = tf_cube(tf.constant(2.0))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 196,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=float32, numpy=8.0>"
 								      ]
 								     },
 								     "execution_count": 196,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "result"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 197,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "x = 2\n"
 								     ]
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "result = tf_cube(2)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 198,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "x = 3\n"
 								     ]
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "result = tf_cube(3)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 199,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "x = Tensor(\"x:0\", shape=(1, 2), dtype=float32)\n"
 								     ]
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "result = tf_cube(tf.constant([[1., 2.]]))  # New shape: trace!"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 200,
 								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "x = Tensor(\"x:0\", shape=(2, 2), dtype=float32)\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "WARNING:tensorflow:5 out of the last 5 calls to <function tf_cube at 0x19f910c10> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "name": "stderr",
 								     "output_type": "stream",
 								     "text": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "WARNING:tensorflow:5 out of the last 5 calls to <function tf_cube at 0x19f910c10> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    }
 								   ],
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "source": [
 								    "result = tf_cube(tf.constant([[3., 4.], [5., 6.]]))  # New shape: trace!"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 201,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "result = tf_cube(tf.constant([[7., 8.], [9., 10.]]))  # Same shape: no trace"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "It is also possible to specify a particular input signature:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 202,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "@tf.function(input_signature=[tf.TensorSpec(shape=[None, 28, 28], dtype=tf.float32)])\n",
 								    "def shrink(images):\n",
 								    "    \"\"\"Keep every other row and every other column of the input images.\"\"\"\n",
 								    "    print(\"Tracing\", images)  # extra code – printed only when the function gets traced\n",
 								    "    downsampled = images[:, ::2, ::2]  # step of 2 along the last two axes\n",
 								    "    return downsampled"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 203,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 204,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Tracing Tensor(\"images:0\", shape=(None, 28, 28), dtype=float32)\n"
 								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "img_batch_1 = tf.random.uniform(shape=[100, 28, 28])\n",
 								    "img_batch_2 = tf.random.uniform(shape=[50, 28, 28])\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "preprocessed_images = shrink(img_batch_1)  # Works fine, traces the function\n",
 								    "preprocessed_images = shrink(img_batch_2)  # Works fine, same concrete function"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 205,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "Binding inputs to tf.function `shrink` failed due to `Can not cast TensorSpec(shape=(2, 2, 2), dtype=tf.float32, name=None) to TensorSpec(shape=(None, 28, 28), dtype=tf.float32, name=None)`. Received args: (<tf.Tensor: shape=(2, 2, 2), dtype=float32, numpy=\n",
 								      "array([[[0.7413678 , 0.62854624],\n",
 								      "        [0.01738465, 0.3431449 ]],\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "       [[0.51063764, 0.3777541 ],\n",
 								      "        [0.07321596, 0.02137029]]], dtype=float32)>,) and kwargs: {} for signature: (images: TensorSpec(shape=(None, 28, 28), dtype=tf.float32, name=None)).\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "img_batch_3 = tf.random.uniform(shape=[2, 2, 2])\n",
 								    "try:\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "    preprocessed_images = shrink(img_batch_3)  # TypeError! Incompatible inputs\n",
 								    "except TypeError as ex:\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    print(ex)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### Using AutoGraph to Capture Control Flow"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "A \"static\" `for` loop using `range()`:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 206,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "@tf.function\n",
 								    "def add_10(x):\n",
 								    "    \"\"\"Add 10 to x by applying `+= 1` ten times in a plain Python loop.\"\"\"\n",
 								    "    for _ in range(10):  # Python range(): each iteration becomes its own add op\n",
 								    "        x += 1\n",
 								    "    return x"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 207,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=15>"
 								      ]
 								     },
 								     "execution_count": 207,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "add_10(tf.constant(5))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 208,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Operation 'x' type=Placeholder>,\n",
 								       " <tf.Operation 'add/y' type=Const>,\n",
 								       " <tf.Operation 'add' type=AddV2>,\n",
 								       " <tf.Operation 'add_1/y' type=Const>,\n",
 								       " <tf.Operation 'add_1' type=AddV2>,\n",
 								       " <tf.Operation 'add_2/y' type=Const>,\n",
 								       " <tf.Operation 'add_2' type=AddV2>,\n",
 								       " <tf.Operation 'add_3/y' type=Const>,\n",
 								       " <tf.Operation 'add_3' type=AddV2>,\n",
 								       " <tf.Operation 'add_4/y' type=Const>,\n",
 								       " <tf.Operation 'add_4' type=AddV2>,\n",
 								       " <tf.Operation 'add_5/y' type=Const>,\n",
 								       " <tf.Operation 'add_5' type=AddV2>,\n",
 								       " <tf.Operation 'add_6/y' type=Const>,\n",
 								       " <tf.Operation 'add_6' type=AddV2>,\n",
 								       " <tf.Operation 'add_7/y' type=Const>,\n",
 								       " <tf.Operation 'add_7' type=AddV2>,\n",
 								       " <tf.Operation 'add_8/y' type=Const>,\n",
 								       " <tf.Operation 'add_8' type=AddV2>,\n",
 								       " <tf.Operation 'add_9/y' type=Const>,\n",
 								       " <tf.Operation 'add_9' type=AddV2>,\n",
 								       " <tf.Operation 'Identity' type=Identity>]"
 								      ]
 								     },
 								     "execution_count": 208,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "add_10.get_concrete_function(tf.constant(5)).graph.get_operations()"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "A \"dynamic\" loop using `tf.while_loop()`:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 209,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "# extra code – shows how to use tf.while_loop() directly (usually it is simpler to let\n",
 								    "# @tf.function's AutoGraph convert a `for` loop over tf.range())\n",
 								    "@tf.function\n",
 								    "def add_10(x):\n",
 								    "    \"\"\"Add 10 to x using an explicit tf.while_loop() that iterates ten times.\"\"\"\n",
 								    "    def condition(i, x):\n",
 								    "        return tf.less(i, 10)  # keep looping while the counter is below 10\n",
 								    "\n",
 								    "    def body(i, x):\n",
 								    "        return tf.add(i, 1), tf.add(x, 1)  # next loop state: (i + 1, x + 1)\n",
 								    "\n",
 								    "    # loop state is [counter, value]; only the final value is needed\n",
 								    "    _, final_x = tf.while_loop(condition, body, [tf.constant(0), x])\n",
 								    "    return final_x"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 210,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=15>"
 								      ]
 								     },
 								     "execution_count": 210,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "add_10(tf.constant(5))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 211,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Operation 'x' type=Placeholder>,\n",
 								       " <tf.Operation 'Const' type=Const>,\n",
 								       " <tf.Operation 'while/maximum_iterations' type=Const>,\n",
 								       " <tf.Operation 'while/loop_counter' type=Const>,\n",
 								       " <tf.Operation 'while' type=StatelessWhile>,\n",
 								       " <tf.Operation 'Identity' type=Identity>]"
 								      ]
 								     },
 								     "execution_count": 211,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "add_10.get_concrete_function(tf.constant(5)).graph.get_operations()"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "A \"dynamic\" `for` loop using `tf.range()` (captured by AutoGraph):"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 212,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "@tf.function\n",
 								    "def add_10(x):\n",
 								    "    \"\"\"Add 10 to x using a `for` loop over tf.range(10).\"\"\"\n",
 								    "    for _ in tf.range(10):  # tensor range: the loop becomes a single while op\n",
 								    "        x = x + 1\n",
 								    "    return x"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 213,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "[<tf.Operation 'x' type=Placeholder>,\n",
 								       " <tf.Operation 'range/start' type=Const>,\n",
 								       " <tf.Operation 'range/limit' type=Const>,\n",
 								       " <tf.Operation 'range/delta' type=Const>,\n",
 								       " <tf.Operation 'range' type=Range>,\n",
 								       " <tf.Operation 'sub' type=Sub>,\n",
 								       " <tf.Operation 'floordiv' type=FloorDiv>,\n",
 								       " <tf.Operation 'mod' type=FloorMod>,\n",
 								       " <tf.Operation 'zeros_like' type=Const>,\n",
 								       " <tf.Operation 'NotEqual' type=NotEqual>,\n",
 								       " <tf.Operation 'Cast' type=Cast>,\n",
 								       " <tf.Operation 'add' type=AddV2>,\n",
 								       " <tf.Operation 'zeros_like_1' type=Const>,\n",
 								       " <tf.Operation 'Maximum' type=Maximum>,\n",
 								       " <tf.Operation 'while/maximum_iterations' type=Const>,\n",
 								       " <tf.Operation 'while/loop_counter' type=Const>,\n",
 								       " <tf.Operation 'while' type=StatelessWhile>,\n",
 								       " <tf.Operation 'Identity' type=Identity>]"
 								      ]
 								     },
 								     "execution_count": 213,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "add_10.get_concrete_function(tf.constant(0)).graph.get_operations()"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### Handling Variables and Other Resources in TF Functions"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 214,
 								   "metadata": {},
 								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=2>"
 								      ]
 								     },
 								     "execution_count": 214,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
 								   "source": [
 								    "counter = tf.Variable(0)\n",
 								    "\n",
 								    "@tf.function\n",
 								    "def increment(counter, c=1):\n",
 								    "    \"\"\"Call counter.assign_add(c) on the variable passed in and return its result.\"\"\"\n",
 								    "    updated = counter.assign_add(c)\n",
 								    "    return updated\n",
 								    "\n",
 								    "increment(counter)  # counter is now equal to 1\n",
 								    "increment(counter)  # counter is now equal to 2"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 215,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "name: \"counter\"\n",
 								       "type: DT_RESOURCE"
 								      ]
 								     },
 								     "execution_count": 215,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "function_def = increment.get_concrete_function(counter).function_def\n",
 								    "function_def.signature.input_arg[0]"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": 216,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "counter = tf.Variable(0)\n",
 								    "\n",
 								    "@tf.function\n",
 								    "def increment(c=1):\n",
 								    "    \"\"\"Call assign_add(c) on the global `counter` variable and return its result.\"\"\"\n",
 								    "    updated = counter.assign_add(c)\n",
 								    "    return updated"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 217,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=2>"
 								      ]
 								     },
 								     "execution_count": 217,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "increment()\n",
 								    "increment()"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 218,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "name: \"assignaddvariableop_resource\"\n",
 								       "type: DT_RESOURCE"
 								      ]
 								     },
 								     "execution_count": 218,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "function_def = increment.get_concrete_function().function_def\n",
 								    "function_def.signature.input_arg[0]"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 219,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "class Counter:\n",
 								    "    def __init__(self):\n",
 								    "        self.counter = tf.Variable(0)\n",
 								    "\n",
 								    "    @tf.function\n",
 								    "    def increment(self, c=1):\n",
 								    "        return self.counter.assign_add(c)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 220,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<tf.Tensor: shape=(), dtype=int32, numpy=2>"
 								      ]
 								     },
 								     "execution_count": 220,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "c = Counter()\n",
 								    "c.increment()\n",
 								    "c.increment()"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 221,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {
 								    "scrolled": true
 								   },
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "def tf__add(x):\n",
 								      "    with ag__.FunctionScope('add_10', 'fscope', ag__.ConversionOptions(recursive=True, user_requested=True, optional_features=(), internal_convert_user_code=True)) as fscope:\n",
 								      "        do_return = False\n",
 								      "        retval_ = ag__.UndefinedReturnValue()\n",
 								      "\n",
 								      "        def get_state():\n",
 								      "            return (x,)\n",
 								      "\n",
 								      "        def set_state(vars_):\n",
 								      "            nonlocal x\n",
 								      "            (x,) = vars_\n",
 								      "\n",
 								      "        def loop_body(itr):\n",
 								      "            nonlocal x\n",
 								      "            i = itr\n",
 								      "            x = ag__.ld(x)\n",
 								      "            x += 1\n",
 								      "        i = ag__.Undefined('i')\n",
 								      "        ag__.for_stmt(ag__.converted_call(ag__.ld(tf).range, (10,), None, fscope), None, loop_body, get_state, set_state, ('x',), {'iterate_names': 'i'})\n",
 								      "        try:\n",
 								      "            do_return = True\n",
 								      "            retval_ = ag__.ld(x)\n",
 								      "        except:\n",
 								      "            do_return = False\n",
 								      "            raise\n",
 								      "        return fscope.ret(retval_, do_return)\n",
 								      "\n"
 								     ]
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "@tf.function\n",
 								    "def add_10(x):\n",
 								    "    for i in tf.range(10):\n",
 								    "        x += 1\n",
 								    "    return x\n",
 								    "\n",
-												Update libraries to latest version, including TensorFlow 2.4.1 and Scikit-Learn 0.24.1

											
										
										
											2021-02-14 03:02:09 +01:00
+								    "print(tf.autograph.to_code(add_10.python_function))"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 222,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "# extra code – shows how to display the autograph code with syntax highlighting\n",
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								    "def display_tf_code(func):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    from IPython.display import display, Markdown\n",
 								    "    if hasattr(func, \"python_function\"):\n",
 								    "        func = func.python_function\n",
-												Work around issue with custom metric persistence

											
										
										
											2019-11-06 04:36:21 +01:00
+								    "    code = tf.autograph.to_code(func)\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "    display(Markdown(f'```python\\n{code}\\n```'))"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 223,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/markdown": [
 								       "```python\n",
 								       "def tf__add(x):\n",
 								       "    with ag__.FunctionScope('add_10', 'fscope', ag__.ConversionOptions(recursive=True, user_requested=True, optional_features=(), internal_convert_user_code=True)) as fscope:\n",
 								       "        do_return = False\n",
 								       "        retval_ = ag__.UndefinedReturnValue()\n",
 								       "\n",
 								       "        def get_state():\n",
 								       "            return (x,)\n",
 								       "\n",
 								       "        def set_state(vars_):\n",
 								       "            nonlocal x\n",
 								       "            (x,) = vars_\n",
 								       "\n",
 								       "        def loop_body(itr):\n",
 								       "            nonlocal x\n",
 								       "            i = itr\n",
 								       "            x = ag__.ld(x)\n",
 								       "            x += 1\n",
 								       "        i = ag__.Undefined('i')\n",
 								       "        ag__.for_stmt(ag__.converted_call(ag__.ld(tf).range, (10,), None, fscope), None, loop_body, get_state, set_state, ('x',), {'iterate_names': 'i'})\n",
 								       "        try:\n",
 								       "            do_return = True\n",
 								       "            retval_ = ag__.ld(x)\n",
 								       "        except:\n",
 								       "            do_return = False\n",
 								       "            raise\n",
 								       "        return fscope.ret(retval_, do_return)\n",
 								       "\n",
 								       "```"
 								      ],
 								      "text/plain": [
 								       "<IPython.core.display.Markdown object>"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "display_tf_code(add_10)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "## Using TF Functions with tf.keras (or Not)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "By default, tf.keras will automatically convert your custom code into TF Functions, so there is no need to use\n",
 								    "`tf.function()`:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 224,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "# Custom loss function\n",
 								    "def my_mse(y_true, y_pred):\n",
 								    "    print(\"Tracing loss my_mse()\")\n",
 								    "    return tf.reduce_mean(tf.square(y_pred - y_true))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 225,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "# Custom metric function\n",
 								    "def my_mae(y_true, y_pred):\n",
 								    "    print(\"Tracing metric my_mae()\")\n",
 								    "    return tf.reduce_mean(tf.abs(y_pred - y_true))"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 226,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "# Custom layer\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class MyDense(tf.keras.layers.Layer):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, units, activation=None, **kwargs):\n",
 								    "        super().__init__(**kwargs)\n",
 								    "        self.units = units\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "        self.activation = tf.keras.activations.get(activation)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
 								    "    def build(self, input_shape):\n",
 								    "        self.kernel = self.add_weight(name='kernel', \n",
 								    "                                      shape=(input_shape[1], self.units),\n",
 								    "                                      initializer='uniform',\n",
 								    "                                      trainable=True)\n",
 								    "        self.biases = self.add_weight(name='bias', \n",
 								    "                                      shape=(self.units,),\n",
 								    "                                      initializer='zeros',\n",
 								    "                                      trainable=True)\n",
 								    "\n",
 								    "    def call(self, X):\n",
 								    "        print(\"Tracing MyDense.call()\")\n",
 								    "        return self.activation(X @ self.kernel + self.biases)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 227,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 228,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "# Custom model\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class MyModel(tf.keras.Model):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, **kwargs):\n",
 								    "        super().__init__(**kwargs)\n",
 								    "        self.hidden1 = MyDense(30, activation=\"relu\")\n",
 								    "        self.hidden2 = MyDense(30, activation=\"relu\")\n",
 								    "        self.output_ = MyDense(1)\n",
 								    "\n",
 								    "    def call(self, input):\n",
 								    "        print(\"Tracing MyModel.call()\")\n",
 								    "        hidden1 = self.hidden1(input)\n",
 								    "        hidden2 = self.hidden2(hidden1)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "        concat = tf.keras.layers.concatenate([input, hidden2])\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        output = self.output_(concat)\n",
 								    "        return output\n",
 								    "\n",
 								    "model = MyModel()"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 229,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "model.compile(loss=my_mse, optimizer=\"nadam\", metrics=[my_mae])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 230,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/2\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "315/363 [=========================>....] - ETA: 0s - loss: 1.5746 - my_mae: 0.8719Tracing MyModel.call()\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 1s 1ms/step - loss: 1.4303 - my_mae: 0.8219 - val_loss: 0.4932 - val_my_mae: 0.4764\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/2\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 1ms/step - loss: 0.4386 - my_mae: 0.4760 - val_loss: 1.0322 - val_my_mae: 0.4793\n",
 								      "162/162 [==============================] - 0s 704us/step - loss: 0.4204 - my_mae: 0.4711\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "[0.4203692376613617, 0.4711270332336426]"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 230,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "model.fit(X_train_scaled, y_train, epochs=2,\n",
 								    "          validation_data=(X_valid_scaled, y_valid))\n",
 								    "model.evaluate(X_test_scaled, y_test)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "You can turn off this automatic conversion by creating the model with `dynamic=True` (or calling `super().__init__(dynamic=True, **kwargs)` in the model's constructor):"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 231,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 232,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "model = MyModel(dynamic=True)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 233,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "model.compile(loss=my_mse, optimizer=\"nadam\", metrics=[my_mae])"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "Now the custom code will be called at each iteration. Let's fit, validate and evaluate with tiny datasets to avoid getting too much output:"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 234,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n"
 								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "[5.545090198516846, 2.0603599548339844]"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 234,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "model.fit(X_train_scaled[:64], y_train[:64], epochs=1,\n",
 								    "          validation_data=(X_valid_scaled[:64], y_valid[:64]), verbose=0)\n",
 								    "model.evaluate(X_test_scaled[:64], y_test[:64], verbose=0)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Alternatively, you can compile a model with `run_eagerly=True`:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 235,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 236,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "model = MyModel()"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 237,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "model.compile(loss=my_mse, optimizer=\"nadam\", metrics=[my_mae], run_eagerly=True)"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 238,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n",
 								      "Tracing MyModel.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing MyDense.call()\n",
 								      "Tracing loss my_mse()\n",
 								      "Tracing metric my_mae()\n"
 								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "[5.545090198516846, 2.0603599548339844]"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 238,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
 								    "model.fit(X_train_scaled[:64], y_train[:64], epochs=1,\n",
 								    "          validation_data=(X_valid_scaled[:64], y_valid[:64]), verbose=0)\n",
 								    "model.evaluate(X_test_scaled[:64], y_test[:64], verbose=0)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "## Extra Material – Custom Optimizers"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Defining custom optimizers is not very common, but in case you are one of the happy few who gets to write one, here is an example:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 239,
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class MyMomentumOptimizer(tf.keras.optimizers.Optimizer):\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def __init__(self, learning_rate=0.001, momentum=0.9, name=\"MyMomentumOptimizer\", **kwargs):\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "        \"\"\"Gradient descent with momentum optimizer.\"\"\"\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        super().__init__(name, **kwargs)\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "        self._learning_rate = self._build_learning_rate(learning_rate)\n",
 								    "        self.momentum = momentum\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "    def build(self, var_list):\n",
 								    "        \"\"\"Initialize optimizer variables.\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "        Args:\n",
 								    "          var_list: list of model variables to build SGD variables on.\n",
 								    "        \"\"\"\n",
 								    "        super().build(var_list)\n",
 								    "        if getattr(self, \"_built\", False):\n",
 								    "            return\n",
 								    "        self.momentums = []\n",
 								    "        for var in var_list:\n",
 								    "            self.momentums.append(\n",
 								    "                self.add_variable_from_reference(\n",
 								    "                    model_variable=var, variable_name=\"m\"\n",
 								    "                )\n",
 								    "            )\n",
 								    "        self._built = True\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "    def update_step(self, gradient, variable):\n",
 								    "        \"\"\"Update step given gradient and the associated model variable.\"\"\"\n",
 								    "        lr = tf.cast(self.learning_rate, variable.dtype)\n",
 								    "        m = None\n",
 								    "        var_key = self._var_key(variable)\n",
 								    "        momentum = tf.cast(self.momentum, variable.dtype)\n",
 								    "        m = self.momentums[self._index_dict[var_key]]\n",
 								    "        if m is None:\n",
 								    "            variable.assign_add(-gradient * lr)\n",
 								    "        else:\n",
 								    "            m.assign(-gradient * lr + m * momentum)\n",
 								    "            variable.assign_add(m)\n",
 								    "        \n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "    def get_config(self):\n",
 								    "        base_config = super().get_config()\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "        print(\"Config!\")\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        return {\n",
 								    "            **base_config,\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "            \"learning_rate\": self._serialize_hyperparameter(self._learning_rate),\n",
 								    "            \"momentum\": self.momentum,\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "        }"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 240,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/5\n",
 								      "363/363 [==============================] - 0s 660us/step - loss: 1.1844\n",
 								      "Epoch 2/5\n",
 								      "363/363 [==============================] - 0s 625us/step - loss: 0.5635\n",
 								      "Epoch 3/5\n",
 								      "363/363 [==============================] - 0s 609us/step - loss: 0.9703\n",
 								      "Epoch 4/5\n",
 								      "363/363 [==============================] - 0s 627us/step - loss: 0.5678\n",
 								      "Epoch 5/5\n",
 								      "363/363 [==============================] - 0s 640us/step - loss: 0.6350\n"
 								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
 								       "<keras.src.callbacks.History at 0x19c821210>"
 								      ]
 								     },
 								     "execution_count": 240,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
 								   "source": [
 								    "optimizer = MyMomentumOptimizer()\n",
 								    "\n",
 								    "tf.keras.utils.set_random_seed(42)\n",
 								    "model = tf.keras.Sequential([tf.keras.layers.Dense(1, input_shape=[8])])\n",
 								    "model.compile(loss=\"mse\", optimizer=optimizer)\n",
 								    "model.fit(X_train_scaled, y_train, epochs=5)"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "Let's compare that to Keras's built-in momentum optimizer:"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 241,
-												Update notebooks to latest nbformat

											
										
										
											2020-04-06 09:13:12 +02:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "name": "stdout",
 								     "output_type": "stream",
 								     "text": [
 								      "Epoch 1/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 645us/step - loss: 1.1844\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 2/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 721us/step - loss: 0.5635\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 3/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 612us/step - loss: 0.9703\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 4/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 625us/step - loss: 0.5678\n",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      "Epoch 5/5\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								      "363/363 [==============================] - 0s 626us/step - loss: 0.6350\n"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								     ]
 								    },
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<keras.src.callbacks.History at 0x19ea8da20>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 241,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "optimizer = tf.keras.optimizers.SGD(learning_rate=0.001, momentum=0.9)\n",
 								    "\n",
 								    "tf.keras.utils.set_random_seed(42)\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([tf.keras.layers.Dense(1, input_shape=[8])])\n",
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "model.compile(loss=\"mse\", optimizer=optimizer)\n",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								    "model.fit(X_train_scaled, y_train, epochs=5)"
 								   ]
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								  },
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Yep, we get the exact same model! 👍"
 								   ]
 								  },
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "# Exercises"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "## 1. to 11."
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "1. TensorFlow is an open-source library for numerical computation, particularly well suited and fine-tuned for large-scale Machine Learning. Its core is similar to NumPy, but it also features GPU support, support for distributed computing, computation graph analysis and optimization capabilities (with a portable graph format that allows you to train a TensorFlow model in one environment and run it in another), an optimization API based on reverse-mode autodiff, and several powerful APIs such as tf.keras, tf.data, tf.image, tf.signal, and more. Other popular Deep Learning libraries include PyTorch, MXNet, Microsoft Cognitive Toolkit, Theano, Caffe2, and Chainer.\n",
 								    "2. Although TensorFlow offers most of the functionalities provided by NumPy, it is not a drop-in replacement, for a few reasons. First, the names of the functions are not always the same (for example, `tf.reduce_sum()` versus `np.sum()`). Second, some functions do not behave in exactly the same way (for example, `tf.transpose()` creates a transposed copy of a tensor, while NumPy's `T` attribute creates a transposed view, without actually copying any data). Lastly, NumPy arrays are mutable, while TensorFlow tensors are not (but you can use a `tf.Variable` if you need a mutable object).\n",
 								    "3. Both `tf.range(10)` and `tf.constant(np.arange(10))` return a one-dimensional tensor containing the integers 0 to 9. However, the former uses 32-bit integers while the latter uses 64-bit integers. Indeed, TensorFlow defaults to 32 bits, while NumPy defaults to 64 bits.\n",
 								    "4. Beyond regular tensors, TensorFlow offers several other data structures, including sparse tensors, tensor arrays, ragged tensors, queues, string tensors, and sets. The last two are actually represented as regular tensors, but TensorFlow provides special functions to manipulate them (in `tf.strings` and `tf.sets`).\n",
 								    "5. When you want to define a custom loss function, in general you can just implement it as a regular Python function. However, if your custom loss function must support some hyperparameters (or any other state), then you should subclass the `keras.losses.Loss` class and implement the `__init__()` and `call()` methods. If you want the loss function's hyperparameters to be saved along with the model, then you must also implement the `get_config()` method.\n",
 								    "6. Much like custom loss functions, most metrics can be defined as regular Python functions. But if you want your custom metric to support some hyperparameters (or any other state), then you should subclass the `keras.metrics.Metric` class. Moreover, if computing the metric over a whole epoch is not equivalent to computing the mean metric over all batches in that epoch (e.g., as for the precision and recall metrics), then you should subclass the `keras.metrics.Metric` class and implement the `__init__()`, `update_state()`, and `result()` methods to keep track of a running metric during each epoch. You should also implement the `reset_states()` method unless all it needs to do is reset all variables to 0.0. If you want the state to be saved along with the model, then you should implement the `get_config()` method as well.\n",
 								    "7. You should distinguish the internal components of your model (i.e., layers or reusable blocks of layers) from the model itself (i.e., the object you will train). The former should subclass the `keras.layers.Layer` class, while the latter should subclass the `keras.models.Model` class.\n",
 								    "8. Writing your own custom training loop is fairly advanced, so you should only do it if you really need to. Keras provides several tools to customize training without having to write a custom training loop: callbacks, custom regularizers, custom constraints, custom losses, and so on. You should use these instead of writing a custom training loop whenever possible: writing a custom training loop is more error-prone, and it will be harder to reuse the custom code you write. However, in some cases writing a custom training loop is necessary⁠—for example, if you want to use different optimizers for different parts of your neural network, like in the [Wide & Deep paper](https://homl.info/widedeep). A custom training loop can also be useful when debugging, or when trying to understand exactly how training works.\n",
 								    "9. Custom Keras components should be convertible to TF Functions, which means they should stick to TF operations as much as possible and respect all the rules listed in Chapter 12 (in the _TF Function Rules_ section). If you absolutely need to include arbitrary Python code in a custom component, you can either wrap it in a `tf.py_function()` operation (but this will reduce performance and limit your model's portability) or set `dynamic=True` when creating the custom layer or model (or set `run_eagerly=True` when calling the model's `compile()` method).\n",
 								    "10. Please refer to Chapter 12 for the list of rules to respect when creating a TF Function (in the _TF Function Rules_ section).\n",
 								    "11. Creating a dynamic Keras model can be useful for debugging, as it will not compile any custom component to a TF Function, and you can use any Python debugger to debug your code. It can also be useful if you want to include arbitrary Python code in your model (or in your training code), including calls to external libraries. To make a model dynamic, you must set `dynamic=True` when creating it. Alternatively, you can set `run_eagerly=True` when calling the model's `compile()` method. Making a model dynamic prevents Keras from using any of TensorFlow's graph features, so it will slow down training and inference, and you will not have the possibility to export the computation graph, which will limit your model's portability."
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
-												Fix some section levels

											
										
										
											2021-10-02 11:40:18 +02:00
+								    "## 12. Implement a custom layer that performs _Layer Normalization_\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "_We will use this type of layer in Chapter 15 when using Recurrent Neural Networks._"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### a.\n",
 								    "_Exercise: The `build()` method should define two trainable weights *α* and *β*, both of shape `input_shape[-1:]` and data type `tf.float32`. *α* should be initialized with 1s, and *β* with 0s._"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Solution: see below."
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### b.\n",
 								    "_Exercise: The `call()` method should compute the mean_ μ _and standard deviation_ σ _of each instance's features. For this, you can use `tf.nn.moments(inputs, axes=-1, keepdims=True)`, which returns the mean μ and the variance σ<sup>2</sup> of all instances (compute the square root of the variance to get the standard deviation). Then the function should compute and return *α*⊗(*X* - μ)/(σ + ε) + *β*, where ⊗ represents itemwise multiplication (`*`) and ε is a smoothing term (small constant to avoid division by zero, e.g., 0.001)._"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 242,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "class LayerNormalization(tf.keras.layers.Layer):\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "    def __init__(self, eps=0.001, **kwargs):\n",
 								    "        super().__init__(**kwargs)\n",
 								    "        self.eps = eps\n",
 								    "\n",
 								    "    def build(self, batch_input_shape):\n",
 								    "        self.alpha = self.add_weight(\n",
 								    "            name=\"alpha\", shape=batch_input_shape[-1:],\n",
 								    "            initializer=\"ones\")\n",
 								    "        self.beta = self.add_weight(\n",
 								    "            name=\"beta\", shape=batch_input_shape[-1:],\n",
 								    "            initializer=\"zeros\")\n",
 								    "\n",
 								    "    def call(self, X):\n",
 								    "        mean, variance = tf.nn.moments(X, axes=-1, keepdims=True)\n",
 								    "        return self.alpha * (X - mean) / (tf.sqrt(variance + self.eps)) + self.beta\n",
 								    "\n",
 								    "    def get_config(self):\n",
 								    "        base_config = super().get_config()\n",
 								    "        return {**base_config, \"eps\": self.eps}"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Note that making _ε_ a hyperparameter (`eps`) was not compulsory. Also note that it's preferable to compute `tf.sqrt(variance + self.eps)` rather than `tf.sqrt(variance) + self.eps`. Indeed, the derivative of sqrt(z) is undefined when z=0, so training will bomb whenever the variance vector has at least one component equal to 0. Adding _ε_ within the square root guarantees that this will never happen."
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### c.\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "_Exercise: Ensure that your custom layer produces the same (or very nearly the same) output as the `tf.keras.layers.LayerNormalization` layer._"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Let's create one instance of each class, apply them to some data (e.g., the training set), and ensure that the difference is negligible."
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 243,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<tf.Tensor: shape=(), dtype=float32, numpy=3.9782837e-08>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 243,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "source": [
 								    "X = X_train.astype(np.float32)\n",
 								    "\n",
 								    "custom_layer_norm = LayerNormalization()\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "keras_layer_norm = tf.keras.layers.LayerNormalization()\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "tf.reduce_mean(tf.keras.losses.mean_absolute_error(\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "    keras_layer_norm(X), custom_layer_norm(X)))"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Yep, that's close enough. To be extra sure, let's make alpha and beta completely random and compare again:"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 244,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "text/plain": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "<tf.Tensor: shape=(), dtype=float32, numpy=1.764704e-08>"
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								      ]
 								     },
 								     "execution_count": 244,
 								     "metadata": {},
 								     "output_type": "execute_result"
 								    }
 								   ],
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "random_alpha = np.random.rand(X.shape[-1])\n",
 								    "random_beta = np.random.rand(X.shape[-1])\n",
 								    "\n",
 								    "custom_layer_norm.set_weights([random_alpha, random_beta])\n",
 								    "keras_layer_norm.set_weights([random_alpha, random_beta])\n",
 								    "\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "tf.reduce_mean(tf.keras.losses.mean_absolute_error(\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "    keras_layer_norm(X), custom_layer_norm(X)))"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "Still a negligible difference! Our custom layer works fine."
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "## 13. Train a model using a custom training loop to tackle the Fashion MNIST dataset\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "_The Fashion MNIST dataset was introduced in Chapter 10._"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### a.\n",
 								    "_Exercise: Display the epoch, iteration, mean training loss, and mean accuracy over each epoch (updated at each iteration), as well as the validation loss and accuracy at the end of each epoch._"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 245,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "(X_train_full, y_train_full), (X_test, y_test) = tf.keras.datasets.fashion_mnist.load_data()\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "X_train_full = X_train_full.astype(np.float32) / 255.\n",
 								    "X_valid, X_train = X_train_full[:5000], X_train_full[5000:]\n",
 								    "y_valid, y_train = y_train_full[:5000], y_train_full[5000:]\n",
 								    "X_test = X_test.astype(np.float32) / 255."
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 246,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 247,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
 								    "    tf.keras.layers.Flatten(input_shape=[28, 28]),\n",
 								    "    tf.keras.layers.Dense(100, activation=\"relu\"),\n",
 								    "    tf.keras.layers.Dense(10, activation=\"softmax\"),\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 248,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "n_epochs = 5\n",
 								    "batch_size = 32\n",
 								    "n_steps = len(X_train) // batch_size\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "optimizer = tf.keras.optimizers.Nadam(learning_rate=0.01)\n",
 								    "loss_fn = tf.keras.losses.sparse_categorical_crossentropy\n",
 								    "mean_loss = tf.keras.metrics.Mean()\n",
 								    "metrics = [tf.keras.metrics.SparseCategoricalAccuracy()]"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 249,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "a0c8a6efecb44efdbaf6f6f2107a37e6",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "All epochs:   0%|          | 0/5 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "ba37766cb41848b4ae0f544c8ddf238f",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 1/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "dc1d7d5c3f2148b1bb06e974bba09f52",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 2/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "a9fccf049df546079656b4fa4d53cf8a",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 3/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "e63ee530efcf46af907e7ee80bea8be0",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 4/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "a9bbff8ceb73461398293a4f5f1cade8",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 5/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    }
 								   ],
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "source": [
 								    "with trange(1, n_epochs + 1, desc=\"All epochs\") as epochs:\n",
 								    "    for epoch in epochs:\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "        with trange(1, n_steps + 1, desc=f\"Epoch {epoch}/{n_epochs}\") as steps:\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "            for step in steps:\n",
 								    "                X_batch, y_batch = random_batch(X_train, y_train)\n",
 								    "                with tf.GradientTape() as tape:\n",
 								    "                    y_pred = model(X_batch)\n",
 								    "                    main_loss = tf.reduce_mean(loss_fn(y_batch, y_pred))\n",
 								    "                    loss = tf.add_n([main_loss] + model.losses)\n",
 								    "                gradients = tape.gradient(loss, model.trainable_variables)\n",
 								    "                optimizer.apply_gradients(zip(gradients, model.trainable_variables))\n",
 								    "                for variable in model.variables:\n",
 								    "                    if variable.constraint is not None:\n",
 								    "                        variable.assign(variable.constraint(variable))                    \n",
 								    "                status = OrderedDict()\n",
 								    "                mean_loss(loss)\n",
 								    "                status[\"loss\"] = mean_loss.result().numpy()\n",
 								    "                for metric in metrics:\n",
 								    "                    metric(y_batch, y_pred)\n",
 								    "                    status[metric.name] = metric.result().numpy()\n",
 								    "                steps.set_postfix(status)\n",
 								    "            y_pred = model(X_valid)\n",
 								    "            status[\"val_loss\"] = np.mean(loss_fn(y_valid, y_pred))\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "            status[\"val_accuracy\"] = np.mean(tf.keras.metrics.sparse_categorical_accuracy(\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "                tf.constant(y_valid, dtype=np.float32), y_pred))\n",
 								    "            steps.set_postfix(status)\n",
 								    "        for metric in [mean_loss] + metrics:\n",
 								    "            metric.reset_states()\n"
 								   ]
 								  },
 								  {
 								   "cell_type": "markdown",
 								   "metadata": {},
 								   "source": [
 								    "### b.\n",
 								    "_Exercise: Try using a different optimizer with a different learning rate for the upper layers and the lower layers._"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 250,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								    "tf.keras.utils.set_random_seed(42)"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 251,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "lower_layers = tf.keras.Sequential([\n",
 								    "    tf.keras.layers.Flatten(input_shape=[28, 28]),\n",
 								    "    tf.keras.layers.Dense(100, activation=\"relu\"),\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "])\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "upper_layers = tf.keras.Sequential([\n",
 								    "    tf.keras.layers.Dense(10, activation=\"softmax\"),\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "])\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "model = tf.keras.Sequential([\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "    lower_layers, upper_layers\n",
 								    "])"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 252,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "lower_optimizer = tf.keras.optimizers.SGD(learning_rate=1e-4)\n",
 								    "upper_optimizer = tf.keras.optimizers.Nadam(learning_rate=1e-3)"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 253,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
 								   "outputs": [],
 								   "source": [
 								    "n_epochs = 5\n",
 								    "batch_size = 32\n",
 								    "n_steps = len(X_train) // batch_size\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "loss_fn = tf.keras.losses.sparse_categorical_crossentropy\n",
 								    "mean_loss = tf.keras.metrics.Mean()\n",
 								    "metrics = [tf.keras.metrics.SparseCategoricalAccuracy()]"
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   ]
 								  },
 								  {
 								   "cell_type": "code",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "execution_count": 254,
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "metadata": {},
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								   "outputs": [
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "5bdc4d309e3e4f03a27150634a0b89c3",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "All epochs:   0%|          | 0/5 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "b816337dd6ba4177a8bcdd41639a8930",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 1/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "b4cba66f77474d2b9f9de9a207eadf6c",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 2/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "5649fae110bf4f90bce00b39838e05bf",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 3/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "7cd99923c6cc43e78faf87b13be2df7b",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 4/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    },
 								    {
 								     "data": {
 								      "application/vnd.jupyter.widget-view+json": {
-												No longer need super.build() or self.built = True in build() method; also update custom optimizer section and use tf.keras.utils.set_random_seed() instead of tf.random.set_seed()

											
										
										
											2023-09-05 01:38:15 +02:00
+								       "model_id": "39ad913b024f4a2bb31477cfb2d61fbf",
-												Add notebook outputs

											
										
										
											2022-02-19 10:24:54 +01:00
+								       "version_major": 2,
 								       "version_minor": 0
 								      },
 								      "text/plain": [
 								       "Epoch 5/5:   0%|          | 0/1718 [00:00<?, ?it/s]"
 								      ]
 								     },
 								     "metadata": {},
 								     "output_type": "display_data"
 								    }
 								   ],
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								   "source": [
 								    "with trange(1, n_epochs + 1, desc=\"All epochs\") as epochs:\n",
 								    "    for epoch in epochs:\n",
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								    "        with trange(1, n_steps + 1, desc=f\"Epoch {epoch}/{n_epochs}\") as steps:\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "            for step in steps:\n",
 								    "                X_batch, y_batch = random_batch(X_train, y_train)\n",
 								    "                with tf.GradientTape(persistent=True) as tape:\n",
 								    "                    y_pred = model(X_batch)\n",
 								    "                    main_loss = tf.reduce_mean(loss_fn(y_batch, y_pred))\n",
 								    "                    loss = tf.add_n([main_loss] + model.losses)\n",
 								    "                for layers, optimizer in ((lower_layers, lower_optimizer),\n",
 								    "                                          (upper_layers, upper_optimizer)):\n",
 								    "                    gradients = tape.gradient(loss, layers.trainable_variables)\n",
 								    "                    optimizer.apply_gradients(zip(gradients, layers.trainable_variables))\n",
 								    "                del tape\n",
 								    "                for variable in model.variables:\n",
 								    "                    if variable.constraint is not None:\n",
 								    "                        variable.assign(variable.constraint(variable))                    \n",
 								    "                status = OrderedDict()\n",
 								    "                mean_loss(loss)\n",
 								    "                status[\"loss\"] = mean_loss.result().numpy()\n",
 								    "                for metric in metrics:\n",
 								    "                    metric(y_batch, y_pred)\n",
 								    "                    status[metric.name] = metric.result().numpy()\n",
 								    "                steps.set_postfix(status)\n",
 								    "            y_pred = model(X_valid)\n",
 								    "            status[\"val_loss\"] = np.mean(loss_fn(y_valid, y_pred))\n",
-												Replace keras with tf.keras

											
										
										
											2021-10-17 04:04:08 +02:00
+								    "            status[\"val_accuracy\"] = np.mean(tf.keras.metrics.sparse_categorical_accuracy(\n",
-												Add the coding exercise solutions for chapter 12

											
										
										
											2020-03-16 06:51:30 +01:00
+								    "                tf.constant(y_valid, dtype=np.float32), y_pred))\n",
 								    "            steps.set_postfix(status)\n",
 								    "        for metric in [mean_loss] + metrics:\n",
 								    "            metric.reset_states()"
 								   ]
 								  },
 								  {
 								   "cell_type": "code",
 								   "execution_count": null,
 								   "metadata": {},
 								   "outputs": [],
 								   "source": []
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								  }
 								 ],
 								 "metadata": {
 								  "kernelspec": {
-												Big update of chapters 11, 12, 13 for 3rd edition

											
										
										
											2022-02-19 06:19:26 +01:00
+								   "display_name": "Python 3",
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								   "language": "python",
 								   "name": "python3"
 								  },
 								  "language_info": {
 								   "codemirror_mode": {
 								    "name": "ipython",
 								    "version": 3
 								   },
 								   "file_extension": ".py",
 								   "mimetype": "text/x-python",
 								   "name": "python",
 								   "nbconvert_exporter": "python",
 								   "pygments_lexer": "ipython3",
-												Update lib versions and add pydot, fixes #29

											
										
										
											2022-09-22 09:14:01 +02:00
+								   "version": "3.10.6"
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								  }
 								 },
 								 "nbformat": 4,
-												Update notebooks to latest nbformat

											
										
										
											2020-04-06 09:13:12 +02:00
+								 "nbformat_minor": 4
-												Add chapter 12 notebook

											
										
										
											2019-03-05 12:46:03 +01:00
+								}