Calculus - Week 2#
[1]:
import re
from itertools import product
import matplotlib.pyplot as plt
import numpy as np
import plotly.graph_objects as go
import plotly.io as pio
import sympy as sp
from IPython.core.getipython import get_ipython
from IPython.display import display, HTML
from matplotlib.animation import FuncAnimation
plt.style.use("seaborn-v0_8-whitegrid")
pio.renderers.default = "plotly_mimetype+notebook"
Multivariate optimization#
Tangent plane#
The equation of the tangent line to \(f(x)\) at point \(x=a\) is
📐 \(y = \cfrac{d}{dx}f(a)(x-a) + f(a)\)
This is derived from the point-slope form of a line
\(y-y_1 = m(x-x_1)\)
The equation of the tangent plane to \(f(x, y)\) at point \(x=a\) and \(y=b\) is
📐 \(z = \cfrac{\partial}{\partial x}f(a, b)(x-a) + \cfrac{\partial}{\partial y}f(a, b)(y-b) + f(a, b)\)
which, similarly, is derived from the point-slope form of a plane
\(z-z_1 = m_1(x-x_1) + m_2(y-y_1)\)
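Before plotting it, we can build the tangent plane symbolically. Below is a minimal sketch (not a cell from the original notebook) for \(f(x, y) = x^2 + y^2\) at \((a, b) = (2, 4)\):
import sympy as sp

x, y = sp.symbols("x, y")
f = x**2 + y**2
a, b = 2, 4
# point-slope form of a plane, with both partial derivatives evaluated at (a, b)
plane = (
    sp.diff(f, x).subs({x: a, y: b}) * (x - a)
    + sp.diff(f, y).subs({x: a, y: b}) * (y - b)
    + f.subs({x: a, y: b})
)
print(sp.expand(plane))  # 4*x + 8*y - 20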
[2]:
def tangent_line(dfa, a, sym_a, a_range, b, sym_b, f):
    # slope at (a, b) times the offset from a, plus the height of f at (a, b)
    return (
        dfa.evalf(subs={sym_a: a, sym_b: b}) * (a_range - a)
        + f.evalf(subs={sym_a: a, sym_b: b})
    ).astype("float32")
def tangent_plane(dfa, dfb, a, a_range, b, b_range, f):
    # point-slope form of a plane; assumes the global symbols x and y
    return (
        dfa.evalf(subs={x: a, y: b}) * (a_range - a)
        + dfb.evalf(subs={x: a, y: b}) * (b_range - b)
        + f.evalf(subs={x: a, y: b})
    ).astype("float32")
x, y = sp.symbols("x, y")
paraboloid = x**2 + y**2
dfx = sp.diff(paraboloid, x)
dfy = sp.diff(paraboloid, y)
x0 = 2
y0 = 4
full_range = np.linspace(-8, 8, 100)
ycut_xx, ycut_yy = np.meshgrid(full_range, np.linspace(-8, y0, 100))
xcut_xx, xcut_yy = np.meshgrid(np.linspace(-8, x0, 100), full_range)
full_xx, full_yy = np.meshgrid(full_range, full_range)
tan_x = np.linspace(x0 - 4, x0 + 4, 100)
tan_y = np.linspace(y0 - 4, y0 + 4, 100)
tan_xx, tan_yy = np.meshgrid(tan_x, tan_y)
const_x = np.full(100, x0)
const_y = np.full(100, y0)
ycut_paraboloid_surface = go.Surface(
z=sp.lambdify((x, y), paraboloid, "numpy")(ycut_xx, ycut_yy),
x=ycut_xx,
y=ycut_yy,
colorscale="Blues",
contours=dict(x=dict(show=True), y=dict(show=True), z=dict(show=True)),
colorbar=dict(orientation="h", y=-0.2, title=dict(text="z", side="top")),
showlegend=True,
legendgrouptitle_text="Partial derivative wrt x",
legendgroup="x",
name="y-cut parabloid",
)
xcut_paraboloid_surface = go.Surface(
z=sp.lambdify((x, y), paraboloid, "numpy")(xcut_xx, xcut_yy),
x=xcut_xx,
y=xcut_yy,
colorscale="Blues",
contours=dict(x=dict(show=True), y=dict(show=True), z=dict(show=True)),
colorbar=dict(orientation="h", y=-0.2, title=dict(text="z", side="top")),
showlegend=True,
legendgrouptitle_text="Partial derivative wrt y",
legendgroup="y",
name="x-cut parabloid",
)
full_paraboloid_surface = go.Surface(
z=sp.lambdify((x, y), paraboloid, "numpy")(full_xx, full_yy),
x=full_xx,
y=full_yy,
colorscale="Blues",
contours=dict(x=dict(show=True), y=dict(show=True), z=dict(show=True)),
colorbar=dict(orientation="h", y=-0.2, title=dict(text="z", side="top")),
showlegend=True,
name="full parabloid",
)
poi = go.Scatter3d(
x=[x0],
y=[y0],
z=[sp.lambdify((x, y), paraboloid, "numpy")(x0, y0)],
marker=dict(color="#000000"),
showlegend=True,
name="x=2 y=4",
)
yparabola = go.Scatter3d(
x=const_x,
y=full_range,
z=sp.lambdify((x, y), parabloid, "numpy")(const_x, full_range),
mode="lines",
line=dict(color="#000000", width=5),
showlegend=True,
legendgroup="y",
name="y parabola",
)
ytangent = go.Scatter3d(
x=const_x,
y=tan_y,
z=tangent_line(dfa=dfy, a=y0, sym_a=y, a_range=tan_y, b=x0, sym_b=x, f=paraboloid),
mode="lines",
line=dict(color="#000000"),
showlegend=True,
legendgroup="y",
name="y tangent",
)
xparabola = go.Scatter3d(
x=full_range,
y=const_y,
z=sp.lambdify((x, y), parabloid, "numpy")(full_range, const_y),
mode="lines",
line=dict(color="#000000", width=5),
showlegend=True,
legendgroup="x",
name="x parabola",
)
xtangent = go.Scatter3d(
x=tan_x,
y=const_y,
z=tangent_line(dfa=dfx, a=x0, sym_a=x, a_range=tan_x, b=y0, sym_b=y, f=paraboloid),
mode="lines",
line=dict(color="#000000"),
showlegend=True,
legendgroup="x",
name="x tangent",
)
tangent_surface = go.Surface(
z=tangent_plane(
dfa=dfx, dfb=dfy, a=x0, a_range=tan_xx, b=y0, b_range=tan_yy, f=paraboloid
),
x=tan_xx,
y=tan_yy,
colorscale=[[0, "#FF8920"], [1, "#FF8920"]],
showscale=False,
name="tangent plane",
showlegend=True,
)
fig = go.Figure(
data=[
full_paraboloid_surface,
xcut_paraboloid_surface,
ycut_paraboloid_surface,
poi,
xtangent,
xparabola,
ytangent,
yparabola,
tangent_surface,
]
)
fig.update_layout(
title="Tangent plane of parabloid at x=2 and y=4",
autosize=False,
width=600,
height=600,
margin=dict(l=10, r=10, b=10, t=30),
legend=dict(groupclick="togglegroup", itemclick="toggleothers"),
scene_camera=dict(
eye=dict(x=1.5, y=1.5, z=0.5),
),
)
fig.show()
Partial derivatives#
If we look at the tangent plane in the previous plot from a certain angle, we'll see two orthogonal lines, as if they were the axes of the plane.
😉 click on Reset camera to last save on the plot's navbar to reset the eye to (x=1.5, y=1.5, z=0.5)
The two lines that span the tangent plane are the tangent lines to the surface at that point, and their respective slopes are called partial derivatives.
To visualize (or at least get a sense of) the partial derivative:
\(\cfrac{\partial}{\partial x}f(x, y)\) at \(x=2\): select the legend group Partial derivative wrt x.
\(\cfrac{\partial}{\partial y}f(x, y)\) at \(y=4\): select the legend group Partial derivative wrt y.
In either case, we can see that the partial derivative is just the derivative of the imaginary 2D parabola that results from \(f(x, y)\) while keeping one of the two variables constant.
In fact, calculating partial derivatives is a 2-step process:
treat all the other variables as constants
apply the same rules of differentiation
For example, let \(f(x, y) = x^2+y^2\). To calculate \(\cfrac{\partial}{\partial x}(x^2+y^2)\) we
treat \(y\) as a constant, say 1. We don't usually make this substitution in practice; we do it here only to drive the point home.
\(f(x, 1) = x^2+1^2\)
apply the same rules of differentiation (in this case, the power, constant and sum rules)
\(\cfrac{\partial f(x,y)}{\partial x} = 2x + 0 = 2x\)
Let's do another example. Let \(f(x, y) = x^2y^2\).
We could do the same as before and replace \(y\) with 1, but in this and more complex cases it might create more confusion than help, since we'd have to revert the substitution whenever \(y\) doesn't vanish like it did in the previous example.
Let's leave \(y\) as is and just treat it as a constant. By the power rule and the constant multiple rule we have
\(\cfrac{\partial f(x,y)}{\partial x} = 2xy^2\)
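We can ask sympy to confirm both examples; a minimal check (not a cell from the original notebook):
import sympy as sp

x, y = sp.symbols("x, y")
print(sp.diff(x**2 + y**2, x))  # 2*x
print(sp.diff(x**2 * y**2, x))  # 2*x*y**2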
Setting the partial derivatives to 0 to find the minima and maxima#
Let’s imagine we are in a sauna 5 meters wide and 5 meters long. We want to find the coldest place in the room.
Conveniently, we know the function of the temperature in terms of the room coordinates.
[3]:
x, y = sp.symbols("x, y")
temp = 50 - sp.Rational(1, 50) * x**2 * (x - 6) * y**2 * (y - 6)
temp
[3]:
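\(50 - \cfrac{x^{2} y^{2} \left(x - 6\right) \left(y - 6\right)}{50}\)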
[4]:
room_size = 5
xx, yy = np.meshgrid(np.linspace(0, room_size, 100), np.linspace(0, room_size, 100))
surface = go.Surface(
z=sp.lambdify((x, y), temp, "numpy")(xx, yy),
x=xx,
y=yy,
colorscale="RdBu_r",
contours=dict(x=dict(show=True), y=dict(show=True), z=dict(show=True)),
colorbar=dict(title="Temperature"),
name="temperature function",
)
fig = go.Figure(surface)
fig.update_layout(
title="Function of the sauna temperature",
autosize=False,
width=600,
height=600,
scene_aspectmode="cube",
margin=dict(l=10, r=10, b=10, t=30),
scene_camera=dict(
eye=dict(x=2.1, y=0.1, z=0.7),
),
)
fig.show()
Let’s calculate the partial derivative wrt x.
[5]:
dfx = sp.diff(temp, x).factor()
dfx
[5]:
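\(- \cfrac{3 x y^{2} \left(x - 4\right) \left(y - 6\right)}{50}\)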
Let’s calculate the partial derivative wrt y.
[6]:
dfy = sp.diff(temp, y).factor()
dfy
[6]:
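\(- \cfrac{3 x^{2} y \left(x - 6\right) \left(y - 4\right)}{50}\)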
Let’s check where the partial derivatives are 0.
[7]:
solutions = {"x": set(), "y": set()}
for s in sp.solve(dfx) + sp.solve(dfy):
    # sp.solve returns dicts such as {x: 0}; collect the candidate coordinates
    for k, v in s.items():
        # keep only coordinates that fall inside the room
        if v <= room_size:
            solutions[str(k)].add(float(v))
solutions = list(product(solutions["x"], solutions["y"]))
zs = []
for s in solutions:
    z = sp.lambdify((x, y), temp, "numpy")(s[0], s[1])
    zs.append(z)
    # color and label each critical point by its height
    fig.add_scatter3d(
        x=[s[0]],
        y=[s[1]],
        z=[z],
        marker=dict(color="#67001F" if z > 40 else "#053061"),
        name="maximum" if z > 40 else "minimum",
    )
fig.update_layout(
title="Maxima and minima of the function",
showlegend=False,
scene_camera=dict(
eye=dict(x=2.0, y=-1.0, z=0.2),
),
)
fig.show()
Let’s show the tangent plane at the minimum point.
[8]:
x0, y0 = solutions[np.argmin(zs)]
tan_x = np.linspace(x0 - 1, x0 + 1, 100)
tan_y = np.linspace(y0 - 1, y0 + 1, 100)
tan_xx, tan_yy = np.meshgrid(tan_x, tan_y)
const_x = np.full(100, x0)
const_y = np.full(100, y0)
ytangent = go.Scatter3d(
x=const_x,
y=tan_y,
z=tangent_line(dfa=dfy, a=y0, sym_a=y, a_range=tan_y, b=x0, sym_b=x, f=temp),
mode="lines",
line=dict(color="#000000"),
showlegend=True,
legendgroup="y",
name="y tangent",
)
xtangent = go.Scatter3d(
x=tan_x,
y=const_y,
z=tangent_line(dfa=dfx, a=x0, sym_a=x, a_range=tan_x, b=y0, sym_b=y, f=temp),
mode="lines",
line=dict(color="#000000"),
showlegend=True,
legendgroup="x",
name="x tangent",
)
tangent_surface = go.Surface(
z=tangent_plane(
dfa=dfx, dfb=dfy, a=x0, a_range=tan_xx, b=y0, b_range=tan_yy, f=temp
),
x=tan_xx,
y=tan_yy,
colorscale=[[0, "#FF8920"], [1, "#FF8920"]],
showscale=False,
name="tangent plane",
showlegend=True,
)
fig.add_traces([ytangent, xtangent, tangent_surface])
fig.update_layout(
title="Tangent plane at the minimum",
)
fig.show()
Gradient#
🔑 The gradient of \(f\) is a vector, each element of which is a partial derivative of \(f\)
\(\nabla f(x_1, x_2, \cdots, x_n) = \langle \cfrac{\partial f}{\partial x_1}, \cfrac{\partial f}{\partial x_2}, \cdots, \cfrac{\partial f}{\partial x_n} \rangle\)
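For example, for \(f(x, y) = x^2 + y^2\) we have \(\nabla f(x, y) = \langle 2x, 2y \rangle\).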
Assume we are at a point \(\vec{p}\) in the domain of \(f\), which is \(\mathbb{R}^3\):
\(\vec{p} = \begin{bmatrix}0.3\\0.2\\0.8\\\end{bmatrix}\)
Upon calculating the partial derivatives of \(f(\vec{p})\), suppose we obtain the gradient:
\(\nabla f(\vec{p}) = \begin{bmatrix}0.05\\-0.2\\-0.1\end{bmatrix}\)
This implies that:
The function \(f\) is increasing if we move in the positive direction along the first dimension, because that slope is positive
The function \(f\) is increasing if we move in the negative direction along the other two dimensions, because those slopes are negative
Furthermore, the second dimension has the steepest ascent (the largest slope in absolute value), while the first has the flattest.
🔑 \(\nabla f\) provides the direction and rate of fastest increase of \(f\), while \(-\nabla f\) provides the direction and rate of fastest decrease of \(f\)
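As a quick sanity check, the first-order Taylor approximation \(f(\vec{p} + \vec{\delta}) \approx f(\vec{p}) + \nabla f(\vec{p}) \cdot \vec{\delta}\) predicts that a small step against the gradient decreases \(f\). A minimal sketch (not a cell from the original notebook) using the gradient above:
import numpy as np

grad = np.array([0.05, -0.2, -0.1])  # the example gradient above
step = -0.1 * grad  # a small step against the gradient
# predicted first-order change in f: -0.1 * ||grad||^2
print(grad @ step)  # -0.00525, so f is predicted to decrease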
[9]:
nabla = sp.lambdify(
(x, y), sp.Matrix([sp.diff(temp, x), sp.diff(temp, y)]), "numpy"
)
p0 = np.array([1.0, 3.0])
g0 = nabla(*p0)
xx, yy = np.meshgrid(np.linspace(0, 5, 100), np.linspace(0, 5, 100))
cs = plt.contourf(
xx, yy, sp.lambdify((x, y), temp, "numpy")(xx, yy), levels=20, cmap="RdBu_r"
)
plt.scatter(p0[0], p0[1], color="k")
plt.quiver(
p0[0],
p0[1],
-g0[0],
-g0[1],
angles="xy",
scale_units="xy",
scale=10,
color="k",
)
plt.xlabel("x")
plt.ylabel("y")
plt.gca().set_aspect("equal")
plt.title(f"Negative gradient stemming from ${sp.latex(p0)}$")
plt.colorbar(cs, label="z")
plt.show()
Continuing the previous example in \(\mathbb{R}^3\), if our goal is to find a minimum of the function \(f\), one approach is to update our position by taking a step of size \(S\) in the opposite direction of the gradient:
\(\vec{p}_{next} = \langle 0.3, 0.2, 0.8 \rangle - S \cdot \text{sign}(\langle 0.05, -0.2, -0.1 \rangle)\)
This approach doesn't use all the information contained in the gradient, just the direction. It's important to also use the steepness of the slope, so that we can take a larger step where the function is steep (far from the minimum) and a smaller step where it's flat (near the minimum).
A better approach involves taking a step proportional to the value of the negative gradient.
\(\vec{p}_{next} = \langle 0.3, 0.2, 0.8 \rangle - \alpha \cdot \langle0.05, -0.2, -0.1 \rangle\)
🔑 \(\alpha\) is called the learning rate and controls the step size
The above is the main idea of the gradient descent algorithm.
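In its simplest form the update rule is only a couple of lines of numpy. A minimal sketch (not a cell from the original notebook) on \(f(x, y) = x^2 + y^2\), whose gradient \(\langle 2x, 2y \rangle\) we hard-code:
import numpy as np

p = np.array([0.3, 0.2])  # initial position
alpha = 0.1  # learning rate
for _ in range(50):
    grad = 2 * p  # gradient of x^2 + y^2 at p
    p = p - alpha * grad  # step against the gradient
print(p)  # very close to the minimum at (0, 0)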
Below is the pseudocode of a typical implementation of the gradient descent algorithm, run for \(T\) steps or until convergence, where convergence is defined in terms of the norm of the gradient.
\(\begin{array}{l} \textbf{Algorithm: } \text{Gradient Descent} \\ \textbf{Input: } \text{initial parameters } p_0, \text{ learning rate } \alpha, \text{ number of iterations } T, \text{ convergence } \epsilon \\ \textbf{Output: } \text{final parameters } p\\ \phantom{0}1 : p \gets p_0 \\ \phantom{0}2 : \text{evaluate gradient } \nabla f(p) \\ \phantom{0}3 : \text{for i = 1 to T do} \\ \phantom{0}4 : \quad p_{new} \gets p - \alpha \nabla f(p) \\ \phantom{0}5 : \quad \text{evaluate gradient } \nabla f(p_{new}) \\ \phantom{0}6 : \quad \text{if } \|\nabla f(p_{new})\| < \epsilon \text{ then} \\ \phantom{0}7 : \quad \quad \text{return } p_{new} \\ \phantom{0}8 : \quad \text {end if} \\ \phantom{0}9 : \quad p \gets p_{new} \\ 10: \text{end for} \\ 11: \text{return } p \end{array}\)
🔑 Gradient descent is an iterative algorithm that uses the information contained in the gradient at a point to find the local minimum of a differentiable function
[10]:
def bivariate_gradient_descent(f, symbols, initial, steps, learning_rate):
    x, y = symbols
    nabla = sp.lambdify(
        (x, y), sp.Matrix([sp.diff(f, x), sp.diff(f, y)]), "numpy"
    )
    p = np.zeros((steps, 2))
    g = np.zeros((steps, 2))
    step_vector = np.zeros((steps, 2))
    p[0] = initial
    g[0] = nabla(*p[0]).squeeze()
    step_vector[0] = learning_rate * g[0]
    for i in range(1, steps):
        p[i] = p[i - 1] - step_vector[i - 1]
        g[i] = nabla(*p[i]).squeeze()
        step_vector[i] = learning_rate * g[i]
        # stop early once the gradient norm signals convergence
        if np.linalg.norm(g[i]) < 1e-4:
            break
    return p[: i + 1], g[: i + 1], step_vector[: i + 1]
def fixup_animation_js(html_animation):
    # hide the default controls and let the animation be driven by the
    # setupAnimationIntersectionObserver helper referenced below
    html_animation = html_animation.replace(
        '<div class="anim-controls">',
        '<div class="anim-controls" style="display:none">',
    )
    animation_id = re.findall(r"onclick=\"(.*)\.", html_animation)[0]
    img_id = re.findall(r"<img id=\"(.*)\"", html_animation)[0]
    html_animation += f"""
<script language="javascript">
setupAnimationIntersectionObserver('{animation_id}', '{img_id}');
</script>
"""
    return html_animation
def gradient_descent_animation(f, symbols, initial, steps, learning_rate, lim, cmap):
    def _update(frame):
        # redraw the descent path and negative gradients up to the current frame
        global scat, quiv
        scat = ax.scatter(p[:frame, 0], p[:frame, 1], color="k")
        quiv = ax.quiver(
            p[:frame, 0],
            p[:frame, 1],
            -g[:frame, 0],
            -g[:frame, 1],
            angles="xy",
            scale_units="xy",
            scale=10,
            color="k",
        )

    x, y = symbols
    p, g, _ = bivariate_gradient_descent(f, symbols, initial, steps, learning_rate)
    fig, ax = plt.subplots()
    xx, yy = np.meshgrid(np.linspace(0, lim, 100), np.linspace(0, lim, 100))
    cs = ax.contourf(
        xx,
        yy,
        sp.lambdify((x, y), f, "numpy")(xx, yy),
        levels=20,
        cmap=cmap,
    )
    scat = ax.scatter([], [])
    quiv = ax.quiver([], [], [1e-6], [1e-6])
    ax.set_xlabel("x")
    ax.set_ylabel("y")
    ax.set_aspect("equal")
    plt.colorbar(cs, label="z")
    plt.title(
        rf"Gradient descent from ${sp.latex(p[0])}$ with $\alpha={learning_rate}$"
    )
    ani = FuncAnimation(fig=fig, func=_update, frames=steps)
    html_animation = ani.to_jshtml(default_mode="loop")
    if "runtime" not in get_ipython().config.IPKernelApp.connection_file:
        html_animation = fixup_animation_js(html_animation)
    display(HTML(html_animation))
    plt.close()
gradient_descent_animation(
temp,
(x, y),
initial=np.array([1, 3]),
steps=10,
learning_rate=0.1,
lim=5,
cmap="RdBu_r",
)
One of the major drawbacks of gradient descent is its sensitivity to the learning rate.
[11]:
gradient_descent_animation(
temp,
(x, y),
initial=np.array([1, 3]),
steps=20,
learning_rate=0.3,
lim=5,
cmap="RdBu_r",
)
Convergence is not necessarily guaranteed and the learning rate must be chosen carefully.
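To see why, consider \(f(x) = x^2\): the update \(x \leftarrow x - \alpha \cdot 2x = (1 - 2\alpha)\,x\) diverges as soon as \(|1 - 2\alpha| > 1\), i.e. for any \(\alpha > 1\). A minimal sketch (not a cell from the original notebook):
x_ = 1.0  # start away from the minimum at 0
alpha = 1.1  # learning rate that is too large
for _ in range(10):
    x_ = x_ - alpha * 2 * x_  # each step multiplies x_ by (1 - 2 * alpha) = -1.2
print(x_)  # about 6.19: the iterates oscillate with growing amplitude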
Another drawback of gradient descent is that convergence doesn’t guarantee we’ve reached the global minimum.
Let’s consider a function with multiple minima.
[12]:
x, y = sp.symbols("x, y")
multi = (
-(
10 / (3 + 3 * (x - 0.5) ** 2 + 3 * (y - 0.5) ** 2)
+ 2 / (1 + 2 * ((x - 3) ** 2) + 2 * (y - 1.5) ** 2)
+ 3 / (1 + 0.5 * ((x - 3.5) ** 2) + 0.5 * (y - 4) ** 2)
)
+ 10
)
xx, yy = np.meshgrid(np.linspace(0, 5, 100), np.linspace(0, 5, 100))
surface = go.Surface(
z=sp.lambdify((x, y), multi, "numpy")(xx, yy),
x=xx,
y=yy,
colorscale="BrBg_r",
contours=dict(x=dict(show=True), y=dict(show=True), z=dict(show=True)),
colorbar=dict(title="z"),
name="multi function",
)
fig = go.Figure(surface)
fig.update_layout(
title="Function with multiple minima",
autosize=False,
width=600,
height=600,
scene_aspectmode="cube",
margin=dict(l=10, r=10, b=10, t=30),
scene_camera=dict(
eye=dict(x=-1.2, y=1.8, z=1.25),
),
)
fig.show()
In this case the choice of the initial values is very important.
[13]:
gradient_descent_animation(
multi,
(x, y),
initial=np.array([1, 3]),
steps=50,
learning_rate=0.2,
lim=5,
cmap="BrBG_r",
)
Let's start just 0.2 to the right along the x-axis: we get to a better minimum, and yet not the global one.
[14]:
gradient_descent_animation(
multi,
(x, y),
initial=np.array([1.2, 3]),
steps=50,
learning_rate=0.2,
lim=5,
cmap="BrBG_r",
)
If we start a bit more to the left, we get to the global minimum.
[15]:
gradient_descent_animation(
multi,
(x, y),
initial=np.array([0.6, 3]),
steps=50,
learning_rate=0.2,
lim=5,
cmap="BrBG_r",
)