{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Gradient Descent from scratch" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Requirement already satisfied: plotly in /usr/local/lib/python3.6/dist-packages (4.5.0)\n", "Requirement already satisfied: retrying>=1.3.3 in /usr/local/lib/python3.6/dist-packages (from plotly) (1.3.3)\n", "Requirement already satisfied: six in /usr/local/lib/python3.6/dist-packages (from plotly) (1.14.0)\n" ] } ], "source": [ "!pip3 install plotly" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "from random import randint\n", "from typing import List\n", "from plotly import graph_objects as go" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "# The function we want to run Gradient Descent on\n", "# See: https://en.wikipedia.org/wiki/Paraboloid or https://www.wolframalpha.com/input/?i=x%5E2+%2B+y%5E2\n", "def paraboloid(x: float, y: float) -> float:\n", " return x ** 2 + y ** 2" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "xs: [-10, -9, -8, -7, -6, -5, -4, -3, -2, -1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10]\n", "\n", "ys: [-10, -9, -8, -7, -6, -5, -4, -3, -2, -1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10]\n", "\n", "zs: [[200, 181, 164, 149, 136, 125, 116, 109, 104, 101, 100, 101, 104, 109, 116, 125, 136, 149, 164, 181, 200], [181, 162, 145, 130, 117, 106, 97, 90, 85, 82, 81, 82, 85, 90, 97, 106, 117, 130, 145, 162, 181], [164, 145, 128, 113, 100, 89, 80, 73, 68, 65, 64, 65, 68, 73, 80, 89, 100, 113, 128, 145, 164], [149, 130, 113, 98, 85, 74, 65, 58, 53, 50, 49, 50, 53, 58, 65, 74, 85, 98, 113, 130, 149], [136, 117, 100, 85, 72, 61, 52, 45, 40, 37, 36, 37, 40, 45, 52, 61, 72, 85, 100, 117, 136]] ...\n", "\n" ] } ], "source": [ "# Test data generation # Test data 
generation
# Grid bounds shared by both axes; the stop value is exclusive, as in range()
xs_start, ys_start = -10, -10
xs_stop, ys_stop = 11, 11
xs_step, ys_step = 1, 1

# Sample points along each axis
xs: List[float] = list(range(xs_start, xs_stop, xs_step))
ys: List[float] = list(range(ys_start, ys_stop, ys_step))

# zs[i][j] holds paraboloid(xs[i], ys[j]): one row per x, one entry per y
zs: List[List[float]] = [[paraboloid(x, y) for y in ys] for x in xs]

print(f'xs: {xs}\n')
print(f'ys: {ys}\n')
print(f'zs: {zs[:5]} ...\n') " ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "# Plotting the generated test data\n", "fig = go.Figure(go.Surface(x=xs, y=ys, z=zs, colorscale='Viridis'))\n", "fig.show()" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [], "source": [ "# The Gradient is a vector pointing in the direction of greatest increase\n", "# This function computes gradients for our Paraboloid function (defined above)\n", "# See: https://www.wolframalpha.com/input/?i=gradient+of+x%5E2+%2B+y%5E2\n", "def compute_gradient(vec: List[float]) -> List[float]:\n", " assert len(vec) == 2\n", " x: float = vec[0]\n", " y: float = vec[1]\n", " # The derivative of z with respect to x is 2 * x\n", " # The derivative of z with respect to y is 2 * y\n", " return [2 * x, 2 * y]" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [], "source": [ "# This function computes the next position based on the current position, its computed gradient and the learning rate\n", "def compute_step(curr_pos: List[float], learning_rate: float) -> List[float]:\n", " grad: List[float] = compute_gradient(curr_pos)\n", " grad[0] *= -learning_rate\n", " grad[1] *= -learning_rate\n", " next_pos: List[float] = [0, 0]\n", " next_pos[0] = curr_pos[0] + grad[0]\n", " next_pos[1] = curr_pos[1] + grad[1]\n", " return next_pos" ] }, { "cell_type": "code", "execution_count": 8, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "[4, 7]" ] }, "execution_count": 8, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Pick a random starting position on the surface of our Paraboloid\n", "start_pos: List[float]\n", "\n", "# Ensure that we don't start at a minimum (0, 0 in our case)\n", "while True:\n", "    # randint() includes BOTH endpoints, while xs_stop / ys_stop are exclusive range() stops.\n", "    # Index into the generated grid instead so the start always lies on the plotted surface.\n", "    start_x: float = xs[randint(0, len(xs) - 1)]\n", "    start_y: float = ys[randint(0, len(ys) - 1)]\n", "    # Only the point where both coordinates are 0 is the minimum; points on a single axis are fine\n", "    if start_x != 0 or start_y != 0:\n", "        start_pos = [start_x, start_y]\n", "        break\n", "\n", "start_pos" ] }, { 
"cell_type": "code", "execution_count": 9, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Epoch 0: [3.992, 6.986]\n", "Epoch 500: [1.4671049293897798, 2.5674336264321123]\n", "Epoch 1000: [0.539177573607161, 0.9435607538125328]\n", "Epoch 1500: [0.19815382666720605, 0.34676919666761064]\n", "Epoch 2000: [0.07282376149321286, 0.12744158261312272]\n", "Epoch 2500: [0.026763551969789107, 0.04683621594713106]\n", "Epoch 3000: [0.009835906568851993, 0.017212836495491053]\n", "Epoch 3500: [0.003614806365776567, 0.006325911140109013]\n", "Epoch 4000: [0.0013284820235521919, 0.0023248435412163435]\n", "Epoch 4500: [0.00048823209553084355, 0.00085440616717898]\n", "Best guess for a minimum: [0.00017979037083174428, 0.00031463314895555317]\n" ] } ], "source": [ "epochs: int = 5000\n", "learning_rate: float = 0.001\n", " \n", "best_pos: List[float] = start_pos\n", "\n", "for i in range(0, epochs):\n", " next_pos: List[float] = compute_step(best_pos, learning_rate)\n", " # Print some debug information every once in a while \n", " if i % 500 == 0:\n", " print(f'Epoch {i}: {next_pos}')\n", " best_pos = next_pos \n", "\n", "print(f'Best guess for a minimum: {best_pos}')" ] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.9" } }, "nbformat": 4, "nbformat_minor": 4 }