3b1b-manim/nn/part3.py

from nn.network import *
from nn.part1 import *
from nn.part2 import *

class LayOutPlan(Scene):
    def construct(self):
        title = TextMobject("Plan")
        title.scale(1.5)
        title.to_edge(UP)
        h_line = Line(LEFT, RIGHT).scale(SPACE_WIDTH - 1)
        h_line.next_to(title, DOWN)

        items = BulletedList(
            "Recap",
            "Intuitive walkthrough",
            "Derivatives in \\\\ computational graphs",
        )
        items.to_edge(LEFT, buff = LARGE_BUFF)
        self.add(items)

        rect = ScreenRectangle()
        rect.scale_to_fit_width(2*SPACE_WIDTH - items.get_width() - 2)
        rect.next_to(items, RIGHT, MED_LARGE_BUFF)

        self.play(
            Write(title),
            ShowCreation(h_line),
            ShowCreation(rect),
            run_time = 2
        )
        for i in range(len(items)):
            self.play(items.fade_all_but, i)
            self.dither(2)

class TODOInsertFeedForwardAnimations(TODOStub):
    CONFIG = {
        "message" : "Insert Feed Forward Animations"
    }

class TODOInsertStepsDownCostSurface(TODOStub):
    CONFIG = {
        "message" : "Insert Steps Down Cost Surface"
    }

class TODOInsertDefinitionOfCostFunction(TODOStub):
    CONFIG = {
        "message" : "Insert Definition of cost function"
    }

class TODOInsertGradientNudging(TODOStub):
    CONFIG = {
        "message" : "Insert GradientNudging"
    }

class InterpretGradientComponents(GradientNudging):
    CONFIG = {
        "network_mob_config" : {
            "layer_to_layer_buff" : 3,
        },
        "stroke_width_exp" : 2,
        "n_decimals" : 6,
        "n_steps" : 3,
        "start_cost" : 3.48,
        "delta_cost" : -0.21,
    }
    def construct(self):
        self.setup_network()
        self.add_cost()
        self.add_gradient()
        self.change_weights_repeatedly()
        self.ask_about_high_dimensions()
        self.circle_magnitudes()
        self.isolate_particular_weights()
        self.shift_cost_expression()
        self.tweak_individual_weights()

    def setup_network(self):
        self.network_mob.scale(0.55)
        self.network_mob.to_corner(UP+RIGHT)
        self.color_network_edges()

    def add_cost(self):
        rect = SurroundingRectangle(self.network_mob)
        rect.highlight(RED)
        arrow = Vector(DOWN, color = RED)
        arrow.shift(rect.get_bottom())
        cost = DecimalNumber(self.start_cost)
        cost.highlight(RED)
        cost.next_to(arrow, DOWN)

        cost_expression = TexMobject(
            "C(", "w_0, w_1, \\dots, w_{13{,}001}", ")", "="
        )
        for tex in "()":
            cost_expression.highlight_by_tex(tex, RED)
        cost_expression.next_to(cost, DOWN)
        cost_group = VGroup(cost_expression, cost)
        cost_group.arrange_submobjects(RIGHT)
        cost_group.next_to(arrow, DOWN)

        self.add(rect, arrow, cost_group)

        self.set_variables_as_attrs(
            cost, cost_expression, cost_group,
            network_rect = rect
        )

    def change_weights_repeatedly(self):
        decimals = self.grad_vect.decimals
        grad_terms = self.grad_vect.contents
        edges = VGroup(*reversed(list(
            it.chain(*self.network_mob.edge_groups)
        )))
        cost = self.cost

        for x in range(self.n_steps):
            self.move_grad_terms_into_position(
                grad_terms.copy(),
                *self.get_weight_adjustment_anims(edges, cost)
            )
            self.play(*self.get_decimal_change_anims(decimals))

    def ask_about_high_dimensions(self):
        grad_vect = self.grad_vect

        words = TextMobject(
            "Direction in \\\\ ${13{,}002}$ dimensions?!?")
        words.highlight(YELLOW)
        words.move_to(grad_vect).to_edge(DOWN)
        arrow = Arrow(
            words.get_top(),
            grad_vect.get_bottom(),
            buff = SMALL_BUFF
        )

        randy = Randolph()
        randy.scale(0.6)
        randy.next_to(words, LEFT)
        randy.shift_onto_screen()

        self.play(
            Write(words, run_time = 2), 
            GrowArrow(arrow),
        )
        self.play(FadeIn(randy))
        self.play(randy.change, "confused", words)
        self.play(Blink(randy))
        self.dither()
        self.play(*map(FadeOut, [randy, words, arrow]))

    def circle_magnitudes(self):
        rects = VGroup()
        for decimal in self.grad_vect.decimals:
            rects.add(SurroundingRectangle(VGroup(*decimal[-5:])))
        rects.highlight(WHITE)

        self.play(LaggedStart(ShowCreation, rects))
        self.play(FadeOut(rects))

    def isolate_particular_weights(self):
        vect_contents = self.grad_vect.contents
        w_terms = self.cost_expression[1]

        edges = self.network_mob.edge_groups
        edge1 = self.network_mob.layers[1].neurons[3].edges_in[0].copy()
        edge2 = self.network_mob.layers[1].neurons[9].edges_in[15].copy()
        VGroup(edge1, edge2).set_stroke(width = 4)
        d1 = DecimalNumber(3.2)
        d2 = DecimalNumber(0.1)
        VGroup(edge1, d1).highlight(YELLOW)
        VGroup(edge2, d2).highlight(MAROON_B)
        new_vect_contents = VGroup(
            TexMobject("\\vdots"),
            d1, TexMobject("\\vdots"),
            d2, TexMobject("\\vdots"),
        )
        new_vect_contents.arrange_submobjects(DOWN)
        new_vect_contents.move_to(vect_contents)

        new_w_terms = TexMobject(
            "\\dots", "w_n", "\\dots", "w_k", "\\dots"
        )
        new_w_terms.move_to(w_terms, DOWN)
        new_w_terms[1].highlight(d1.get_color())
        new_w_terms[3].highlight(d2.get_color())

        for d, edge in (d1, edge1), (d2, edge2):
            d.arrow = Arrow(
                d.get_right(), edge.get_center(),
                color = d.get_color()
            )

        self.play(
            FadeOut(vect_contents),
            FadeIn(new_vect_contents),
            FadeOut(w_terms),
            FadeIn(new_w_terms),
            edges.set_stroke, LIGHT_GREY, 0.35,
        )
        self.play(GrowArrow(d1.arrow))
        self.play(ShowCreation(edge1))
        self.dither()
        self.play(GrowArrow(d2.arrow))
        self.play(ShowCreation(edge2))
        self.dither(2)

        self.cost_expression.remove(w_terms)
        self.cost_expression.add(new_w_terms)
        self.set_variables_as_attrs(
            edge1, edge2, new_w_terms, 
            new_decimals = VGroup(d1, d2)
        )

    def shift_cost_expression(self):
        self.play(self.cost_group.shift, DOWN+0.5*LEFT)

    def tweak_individual_weights(self):
        cost = self.cost
        cost_num = cost.number
        edges = VGroup(self.edge1, self.edge2)
        decimals = self.new_decimals
        changes = (1.0, 1./32)
        wn = self.new_w_terms[1]
        wk = self.new_w_terms[3]

        number_line_template = NumberLine(
            x_min = -1,
            x_max = 1,
            tick_frequency = 0.25,
            numbers_with_elongated_ticks = [],
            color = WHITE
        )
        for term in wn, wk, cost:
            term.number_line = number_line_template.copy()
            term.brace = Brace(term.number_line, DOWN, buff = SMALL_BUFF)
            group = VGroup(term.number_line, term.brace)
            group.next_to(term, UP)
            term.dot = Dot()
            term.dot.highlight(term.get_color())
            term.dot.move_to(term.number_line.get_center())
            term.dot.save_state()
            term.dot.move_to(term)
            term.dot.set_fill(opacity = 0)
            term.words = TextMobject("Nudge this weight")
            term.words.scale(0.7)
            term.words.next_to(term.number_line, UP, MED_SMALL_BUFF)

        groups = [
            VGroup(d, d.arrow, edge, w)
            for d, edge, w in zip(decimals, edges, [wn, wk])
        ]
        for group in groups:
            group.save_state()

        for i in range(2):
            group1, group2 = groups[i], groups[1-i]
            change = changes[i]
            edge = edges[i]
            w = group1[-1]
            added_anims = []
            if i == 0:
                added_anims = [
                    GrowFromCenter(cost.brace),
                    ShowCreation(cost.number_line),
                    cost.dot.restore
                ]
            self.play(
                group1.restore,
                group2.fade, 0.7,
                GrowFromCenter(w.brace),
                ShowCreation(w.number_line),
                w.dot.restore,
                Write(w.words, run_time = 1),
                *added_anims
            )
            for x in range(2):
                func = lambda a : interpolate(
                    cost_num, cost_num-change, a
                )
                self.play(
                    ChangingDecimal(cost, func),
                    cost.dot.shift, change*RIGHT,
                    w.dot.shift, 0.25*RIGHT,
                    edge.set_stroke, None, 8,
                    rate_func = lambda t : wiggle(t, 4),
                    run_time = 2,
                )
                self.dither()
            self.play(*map(FadeOut, [
                w.dot, w.brace, w.number_line, w.words
            ]))


    ######

    def move_grad_terms_into_position(self, grad_terms, *added_anims):
        cost_expression = self.cost_expression
        w_terms = self.cost_expression[1]
        points = VGroup(*[
            VectorizedPoint()
            for term in grad_terms
        ])
        points.arrange_submobjects(RIGHT)
        points.replace(w_terms, dim_to_match = 0)

        grad_terms.generate_target()
        grad_terms.target[len(grad_terms)/2].rotate(np.pi/2)
        grad_terms.target.arrange_submobjects(RIGHT)
        grad_terms.target.scale_to_fit_width(cost_expression.get_width())
        grad_terms.target.next_to(cost_expression, DOWN)

        words = TextMobject("Nudge weights")
        words.scale(0.8)
        words.next_to(grad_terms.target, DOWN)

        self.play(
            MoveToTarget(grad_terms),
            FadeIn(words)
        )
        self.play(
            Transform(
                grad_terms, points,
                remover = True,
                submobject_mode = "lagged_start",
                run_time = 1
            ),
            FadeOut(words),
            *added_anims
        )

    def get_weight_adjustment_anims(self, edges, cost):
        start_cost = cost.number
        target_cost = start_cost + self.delta_cost
        w_terms = self.cost_expression[1]

        return [
            self.get_edge_change_anim(edges),
            LaggedStart(
                Indicate, w_terms,
                rate_func = there_and_back,
                run_time = 1.5,
            ),
            ChangingDecimal(
                cost, 
                lambda a : interpolate(start_cost, target_cost, a),
                run_time = 1.5
            )
        ]

class GetLostInNotation(PiCreatureScene):
    def construct(self):
        morty = self.pi_creature
        equations = VGroup(
            TexMobject(
                "\\delta", "^L", "=", "\\nabla_a", "C", 
                "\\odot \\sigma'(", "z", "^L)"
            ),
            TexMobject(
                "\\delta", "^l = ((", "w", "^{l+1})^T", 
                "\\delta", "^{l+1}) \\odot \\sigma'(", "z", "^l)"
            ),
            TexMobject(
                "{\\partial", "C", "\\over \\partial", "b", 
                "_j^l} =", "\\delta", "_j^l"
            ),
            TexMobject(
                "{\\partial", "C", " \\over \\partial", 
                "w", "_{jk}^l} = ", "a", "_k^{l-1}", "\\delta", "_j^l"
            ),
        )
        for equation in equations:
            equation.highlight_by_tex_to_color_map({
                "\\delta" : YELLOW,
                "C" : RED,
                "b" : MAROON_B,
                "w" : BLUE,
                "z" : TEAL,
            })
            equation.highlight_by_tex("nabla", WHITE)
        equations.arrange_submobjects(
            DOWN, buff = MED_LARGE_BUFF, aligned_edge = LEFT
        )

        circle = Circle(radius = 3*SPACE_WIDTH)
        circle.set_fill(WHITE, 0)
        circle.set_stroke(WHITE, 0)

        self.play(
            Write(equations),
            morty.change, "confused", equations
        )
        self.dither()
        self.play(morty.change, "pleading")
        self.dither(2)

        ##
        movers = VGroup(*equations.family_members_with_points())
        random.shuffle(movers.submobjects)
        for mover in list(movers):
            if mover.is_subpath:
                movers.remove(mover)
                continue
            mover.set_stroke(WHITE, width = 0)
            mover.target = Circle()
            mover.target.scale(0.5)
            mover.target.set_fill(mover.get_color(), opacity = 0)
            mover.target.set_stroke(BLACK, width = 1)
            mover.target.move_to(mover)
        self.play(
            LaggedStart(
                MoveToTarget, movers,
                run_time = 2,
            ),
            morty.change, "pondering",
        )
        self.dither()

class TODOInsertPreviewLearning(TODOStub):
    CONFIG = {
        "message" : "Insert PreviewLearning"
    }

class ShowAveragingCost(PreviewLearning):
    CONFIG = {
        "network_scale_val" : 0.8,
        "stroke_width_exp" : 1,
        "start_examples_time" : 5,
        "examples_per_adjustment_time" : 2,
        "n_adjustments" : 5,
        "time_per_example" : 1./15,
        "image_height" : 1.2,
    }
    def construct(self):
        self.setup_network()
        self.setup_diff_words()
        self.show_many_examples()

    def setup_network(self):
        self.network_mob.scale(self.network_scale_val)
        self.network_mob.to_edge(DOWN)
        self.network_mob.shift(LEFT)
        self.color_network_edges()

    def setup_diff_words(self):
        last_layer_copy = self.network_mob.layers[-1].deepcopy()
        last_layer_copy.add(self.network_mob.output_labels.copy())
        last_layer_copy.shift(1.5*RIGHT)

        double_arrow = DoubleArrow(
            self.network_mob.output_labels,
            last_layer_copy,
            color = RED
        )
        brace = Brace(
            VGroup(self.network_mob.layers[-1], last_layer_copy), 
            UP
        )
        cost_words = brace.get_text("Cost of \\\\ one example")
        cost_words.highlight(RED)

        self.add(last_layer_copy, double_arrow, brace, cost_words)
        self.set_variables_as_attrs(
            last_layer_copy, double_arrow, brace, cost_words
        )
        self.last_layer_copy = last_layer_copy

    def show_many_examples(self):
        training_data, validation_data, test_data = load_data_wrapper()
        training_data_iter = iter(training_data)

        average_words = TextMobject("Average over all training examples")
        average_words.next_to(LEFT, RIGHT)
        average_words.to_edge(UP)
        self.add(average_words)

        for x in xrange(int(self.start_examples_time/self.time_per_example)):
            train_in, train_out = training_data_iter.next()
            self.show_one_example(train_in, train_out)
            self.dither(self.time_per_example)

        #Wiggle all edges
        edges = VGroup(*it.chain(*self.network_mob.edge_groups))
        reversed_edges = VGroup(*reversed(edges))
        self.play(LaggedStart(
            ApplyFunction, edges,
            lambda edge : (
                lambda m : m.rotate_in_place(np.pi/12).highlight(YELLOW),
                edge,
            ),
            rate_func = lambda t : wiggle(t, 4),
            run_time = 3,
        ))

        #Show all, then adjust
        words = TextMobject(
            "Each step \\\\ uses every \\\\ example\\\\",
            "$\\dots$theoretically",
            alignment = ""
        )
        words.highlight(YELLOW)
        words.scale(0.8)
        words.to_corner(UP+LEFT)

        for x in xrange(self.n_adjustments):
            for y in xrange(int(self.examples_per_adjustment_time/self.time_per_example)):
                train_in, train_out = training_data_iter.next()
                self.show_one_example(train_in, train_out)
                self.dither(self.time_per_example)
            self.play(LaggedStart(
                ApplyMethod, reversed_edges,
                lambda m : (m.rotate_in_place, np.pi),
                run_time = 1,
                lag_ratio = 0.2,
            ))
            if x < 2:
                self.play(FadeIn(words[x]))
            else:
                self.dither()

    ####

    def show_one_example(self, train_in, train_out):
        if hasattr(self, "curr_image"):
            self.remove(self.curr_image)
        image = MNistMobject(train_in)
        image.scale_to_fit_height(self.image_height)
        image.next_to(
            self.network_mob.layers[0].neurons, UP,
            aligned_edge = LEFT
        )
        self.add(image)
        self.network_mob.activate_layers(train_in)

        index = np.argmax(train_out)
        self.last_layer_copy.neurons.set_fill(opacity = 0)
        self.last_layer_copy.neurons[index].set_fill(WHITE, opacity = 1)
        self.add(self.last_layer_copy)

        self.curr_iamge = image


class WalkThroughTwoExample(ShowAveragingCost):
    def construct(self):
        self.force_skipping()

        self.setup_network()
        self.setup_diff_words()
        self.show_single_example()
        self.expand_last_layer()
        self.cannot_directly_affect_activations()
        self.show_desired_activation_nudges()
        self.focus_on_one_neuron()
        self.show_activation_formula()
        self.three_ways_to_increase()
        self.note_connections_to_brightest_neurons()

    def show_single_example(self):
        two_vect = get_organized_images()[2][0]
        two_out = np.zeroes(10)
        two_out[2] = 1.0
        self.show_one_example(two_vect, two_out)
        for layer in self.network_mob.layers:
            layer.neurons.set_fill(opacity = 0)

        self.revert_to_original_skipping_status()
        self.feed_forward(two_vect)

    def expand_last_layer(self):
        pass

    def cannot_directly_affect_activations(self):
        pass

    def show_desired_activation_nudges(self):
        pass

    def focus_on_one_neuron(self):
        pass

    def show_activation_formula(self):
        pass

    def three_ways_to_increase(self):
        pass

    def note_connections_to_brightest_neurons(self):
        pass
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00			`from nn.network import *`
			`from nn.part1 import *`
			`from nn.part2 import *`

			`class LayOutPlan(Scene):`
			`def construct(self):`
			`title = TextMobject("Plan")`
			`title.scale(1.5)`
			`title.to_edge(UP)`
			`h_line = Line(LEFT, RIGHT).scale(SPACE_WIDTH - 1)`
			`h_line.next_to(title, DOWN)`

			`items = BulletedList(`
			`"Recap",`
			`"Intuitive walkthrough",`
			`"Derivatives in \\\\ computational graphs",`
			`)`
			`items.to_edge(LEFT, buff = LARGE_BUFF)`
			`self.add(items)`

			`rect = ScreenRectangle()`
			`rect.scale_to_fit_width(2*SPACE_WIDTH - items.get_width() - 2)`
			`rect.next_to(items, RIGHT, MED_LARGE_BUFF)`

			`self.play(`
			`Write(title),`
			`ShowCreation(h_line),`
			`ShowCreation(rect),`
			`run_time = 2`
			`)`
			`for i in range(len(items)):`
			`self.play(items.fade_all_but, i)`
			`self.dither(2)`

			`class TODOInsertFeedForwardAnimations(TODOStub):`
			`CONFIG = {`
			`"message" : "Insert Feed Forward Animations"`
			`}`

			`class TODOInsertStepsDownCostSurface(TODOStub):`
			`CONFIG = {`
			`"message" : "Insert Steps Down Cost Surface"`
			`}`

			`class TODOInsertDefinitionOfCostFunction(TODOStub):`
			`CONFIG = {`
			`"message" : "Insert Definition of cost function"`
			`}`

			`class TODOInsertGradientNudging(TODOStub):`
			`CONFIG = {`
			`"message" : "Insert GradientNudging"`
			`}`

InterpretGradientComponents in nn/part3 2017-10-20 16:30:33 -07:00			`class InterpretGradientComponents(GradientNudging):`
			`CONFIG = {`
			`"network_mob_config" : {`
			`"layer_to_layer_buff" : 3,`
			`},`
			`"stroke_width_exp" : 2,`
			`"n_decimals" : 6,`
			`"n_steps" : 3,`
			`"start_cost" : 3.48,`
			`"delta_cost" : -0.21,`
			`}`
			`def construct(self):`
			`self.setup_network()`
			`self.add_cost()`
			`self.add_gradient()`
			`self.change_weights_repeatedly()`
			`self.ask_about_high_dimensions()`
			`self.circle_magnitudes()`
			`self.isolate_particular_weights()`
			`self.shift_cost_expression()`
			`self.tweak_individual_weights()`

			`def setup_network(self):`
			`self.network_mob.scale(0.55)`
			`self.network_mob.to_corner(UP+RIGHT)`
			`self.color_network_edges()`

			`def add_cost(self):`
			`rect = SurroundingRectangle(self.network_mob)`
			`rect.highlight(RED)`
			`arrow = Vector(DOWN, color = RED)`
			`arrow.shift(rect.get_bottom())`
			`cost = DecimalNumber(self.start_cost)`
			`cost.highlight(RED)`
			`cost.next_to(arrow, DOWN)`

			`cost_expression = TexMobject(`
			`"C(", "w_0, w_1, \\dots, w_{13{,}001}", ")", "="`
			`)`
			`for tex in "()":`
			`cost_expression.highlight_by_tex(tex, RED)`
			`cost_expression.next_to(cost, DOWN)`
			`cost_group = VGroup(cost_expression, cost)`
			`cost_group.arrange_submobjects(RIGHT)`
			`cost_group.next_to(arrow, DOWN)`

			`self.add(rect, arrow, cost_group)`

			`self.set_variables_as_attrs(`
			`cost, cost_expression, cost_group,`
			`network_rect = rect`
			`)`

			`def change_weights_repeatedly(self):`
			`decimals = self.grad_vect.decimals`
			`grad_terms = self.grad_vect.contents`
			`edges = VGroup(*reversed(list(`
			`it.chain(*self.network_mob.edge_groups)`
			`)))`
			`cost = self.cost`

			`for x in range(self.n_steps):`
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`self.move_grad_terms_into_position(`
			`grad_terms.copy(),`
			`*self.get_weight_adjustment_anims(edges, cost)`
			`)`
InterpretGradientComponents in nn/part3 2017-10-20 16:30:33 -07:00			`self.play(*self.get_decimal_change_anims(decimals))`

			`def ask_about_high_dimensions(self):`
			`grad_vect = self.grad_vect`

			`words = TextMobject(`
			`"Direction in \\\\ ${13{,}002}$ dimensions?!?")`
			`words.highlight(YELLOW)`
			`words.move_to(grad_vect).to_edge(DOWN)`
			`arrow = Arrow(`
			`words.get_top(),`
			`grad_vect.get_bottom(),`
			`buff = SMALL_BUFF`
			`)`

			`randy = Randolph()`
			`randy.scale(0.6)`
			`randy.next_to(words, LEFT)`
			`randy.shift_onto_screen()`

			`self.play(`
			`Write(words, run_time = 2),`
			`GrowArrow(arrow),`
			`)`
			`self.play(FadeIn(randy))`
			`self.play(randy.change, "confused", words)`
			`self.play(Blink(randy))`
			`self.dither()`
			`self.play(*map(FadeOut, [randy, words, arrow]))`

			`def circle_magnitudes(self):`
			`rects = VGroup()`
			`for decimal in self.grad_vect.decimals:`
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`rects.add(SurroundingRectangle(VGroup(*decimal[-5:])))`
InterpretGradientComponents in nn/part3 2017-10-20 16:30:33 -07:00			`rects.highlight(WHITE)`

			`self.play(LaggedStart(ShowCreation, rects))`
			`self.play(FadeOut(rects))`

			`def isolate_particular_weights(self):`
			`vect_contents = self.grad_vect.contents`
			`w_terms = self.cost_expression[1]`

			`edges = self.network_mob.edge_groups`
			`edge1 = self.network_mob.layers[1].neurons[3].edges_in[0].copy()`
			`edge2 = self.network_mob.layers[1].neurons[9].edges_in[15].copy()`
			`VGroup(edge1, edge2).set_stroke(width = 4)`
			`d1 = DecimalNumber(3.2)`
			`d2 = DecimalNumber(0.1)`
			`VGroup(edge1, d1).highlight(YELLOW)`
			`VGroup(edge2, d2).highlight(MAROON_B)`
			`new_vect_contents = VGroup(`
			`TexMobject("\\vdots"),`
			`d1, TexMobject("\\vdots"),`
			`d2, TexMobject("\\vdots"),`
			`)`
			`new_vect_contents.arrange_submobjects(DOWN)`
			`new_vect_contents.move_to(vect_contents)`

			`new_w_terms = TexMobject(`
			`"\\dots", "w_n", "\\dots", "w_k", "\\dots"`
			`)`
			`new_w_terms.move_to(w_terms, DOWN)`
			`new_w_terms[1].highlight(d1.get_color())`
			`new_w_terms[3].highlight(d2.get_color())`

			`for d, edge in (d1, edge1), (d2, edge2):`
			`d.arrow = Arrow(`
			`d.get_right(), edge.get_center(),`
			`color = d.get_color()`
			`)`

			`self.play(`
			`FadeOut(vect_contents),`
			`FadeIn(new_vect_contents),`
			`FadeOut(w_terms),`
			`FadeIn(new_w_terms),`
			`edges.set_stroke, LIGHT_GREY, 0.35,`
			`)`
			`self.play(GrowArrow(d1.arrow))`
			`self.play(ShowCreation(edge1))`
			`self.dither()`
			`self.play(GrowArrow(d2.arrow))`
			`self.play(ShowCreation(edge2))`
			`self.dither(2)`

			`self.cost_expression.remove(w_terms)`
			`self.cost_expression.add(new_w_terms)`
			`self.set_variables_as_attrs(`
			`edge1, edge2, new_w_terms,`
			`new_decimals = VGroup(d1, d2)`
			`)`

			`def shift_cost_expression(self):`
			`self.play(self.cost_group.shift, DOWN+0.5*LEFT)`

			`def tweak_individual_weights(self):`
			`cost = self.cost`
			`cost_num = cost.number`
			`edges = VGroup(self.edge1, self.edge2)`
			`decimals = self.new_decimals`
			`changes = (1.0, 1./32)`
			`wn = self.new_w_terms[1]`
			`wk = self.new_w_terms[3]`

			`number_line_template = NumberLine(`
			`x_min = -1,`
			`x_max = 1,`
			`tick_frequency = 0.25,`
			`numbers_with_elongated_ticks = [],`
			`color = WHITE`
			`)`
			`for term in wn, wk, cost:`
			`term.number_line = number_line_template.copy()`
			`term.brace = Brace(term.number_line, DOWN, buff = SMALL_BUFF)`
			`group = VGroup(term.number_line, term.brace)`
			`group.next_to(term, UP)`
			`term.dot = Dot()`
			`term.dot.highlight(term.get_color())`
			`term.dot.move_to(term.number_line.get_center())`
			`term.dot.save_state()`
			`term.dot.move_to(term)`
			`term.dot.set_fill(opacity = 0)`
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`term.words = TextMobject("Nudge this weight")`
			`term.words.scale(0.7)`
			`term.words.next_to(term.number_line, UP, MED_SMALL_BUFF)`
InterpretGradientComponents in nn/part3 2017-10-20 16:30:33 -07:00
			`groups = [`
			`VGroup(d, d.arrow, edge, w)`
			`for d, edge, w in zip(decimals, edges, [wn, wk])`
			`]`
			`for group in groups:`
			`group.save_state()`

			`for i in range(2):`
			`group1, group2 = groups[i], groups[1-i]`
			`change = changes[i]`
			`edge = edges[i]`
			`w = group1[-1]`
			`added_anims = []`
			`if i == 0:`
			`added_anims = [`
			`GrowFromCenter(cost.brace),`
			`ShowCreation(cost.number_line),`
			`cost.dot.restore`
			`]`
			`self.play(`
			`group1.restore,`
			`group2.fade, 0.7,`
			`GrowFromCenter(w.brace),`
			`ShowCreation(w.number_line),`
			`w.dot.restore,`
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`Write(w.words, run_time = 1),`
InterpretGradientComponents in nn/part3 2017-10-20 16:30:33 -07:00			`*added_anims`
			`)`
			`for x in range(2):`
			`func = lambda a : interpolate(`
			`cost_num, cost_num-change, a`
			`)`
			`self.play(`
			`ChangingDecimal(cost, func),`
			`cost.dot.shift, change*RIGHT,`
			`w.dot.shift, 0.25*RIGHT,`
			`edge.set_stroke, None, 8,`
			`rate_func = lambda t : wiggle(t, 4),`
			`run_time = 2,`
			`)`
			`self.dither()`
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`self.play(*map(FadeOut, [`
			`w.dot, w.brace, w.number_line, w.words`
			`]))`
InterpretGradientComponents in nn/part3 2017-10-20 16:30:33 -07:00

			`######`

ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`def move_grad_terms_into_position(self, grad_terms, *added_anims):`
InterpretGradientComponents in nn/part3 2017-10-20 16:30:33 -07:00			`cost_expression = self.cost_expression`
			`w_terms = self.cost_expression[1]`
			`points = VGroup(*[`
			`VectorizedPoint()`
			`for term in grad_terms`
			`])`
			`points.arrange_submobjects(RIGHT)`
			`points.replace(w_terms, dim_to_match = 0)`

			`grad_terms.generate_target()`
			`grad_terms.target[len(grad_terms)/2].rotate(np.pi/2)`
			`grad_terms.target.arrange_submobjects(RIGHT)`
			`grad_terms.target.scale_to_fit_width(cost_expression.get_width())`
			`grad_terms.target.next_to(cost_expression, DOWN)`

			`words = TextMobject("Nudge weights")`
			`words.scale(0.8)`
			`words.next_to(grad_terms.target, DOWN)`

			`self.play(`
			`MoveToTarget(grad_terms),`
			`FadeIn(words)`
			`)`
			`self.play(`
			`Transform(`
			`grad_terms, points,`
			`remover = True,`
			`submobject_mode = "lagged_start",`
			`run_time = 1`
			`),`
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`FadeOut(words),`
			`*added_anims`
InterpretGradientComponents in nn/part3 2017-10-20 16:30:33 -07:00			`)`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00
InterpretGradientComponents in nn/part3 2017-10-20 16:30:33 -07:00			`def get_weight_adjustment_anims(self, edges, cost):`
			`start_cost = cost.number`
			`target_cost = start_cost + self.delta_cost`
			`w_terms = self.cost_expression[1]`

			`return [`
			`self.get_edge_change_anim(edges),`
			`LaggedStart(`
			`Indicate, w_terms,`
			`rate_func = there_and_back,`
			`run_time = 1.5,`
			`),`
			`ChangingDecimal(`
			`cost,`
			`lambda a : interpolate(start_cost, target_cost, a),`
			`run_time = 1.5`
			`)`
			`]`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00
GetLostInNotation in nn/part3 2017-10-20 17:10:47 -07:00			`class GetLostInNotation(PiCreatureScene):`
			`def construct(self):`
			`morty = self.pi_creature`
			`equations = VGroup(`
			`TexMobject(`
			`"\\delta", "^L", "=", "\\nabla_a", "C",`
			`"\\odot \\sigma'(", "z", "^L)"`
			`),`
			`TexMobject(`
			`"\\delta", "^l = ((", "w", "^{l+1})^T",`
			`"\\delta", "^{l+1}) \\odot \\sigma'(", "z", "^l)"`
			`),`
			`TexMobject(`
			`"{\\partial", "C", "\\over \\partial", "b",`
			`"_j^l} =", "\\delta", "_j^l"`
			`),`
			`TexMobject(`
			`"{\\partial", "C", " \\over \\partial",`
			`"w", "_{jk}^l} = ", "a", "_k^{l-1}", "\\delta", "_j^l"`
			`),`
			`)`
			`for equation in equations:`
			`equation.highlight_by_tex_to_color_map({`
			`"\\delta" : YELLOW,`
			`"C" : RED,`
			`"b" : MAROON_B,`
			`"w" : BLUE,`
			`"z" : TEAL,`
			`})`
			`equation.highlight_by_tex("nabla", WHITE)`
			`equations.arrange_submobjects(`
			`DOWN, buff = MED_LARGE_BUFF, aligned_edge = LEFT`
			`)`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00
GetLostInNotation in nn/part3 2017-10-20 17:10:47 -07:00			`circle = Circle(radius = 3*SPACE_WIDTH)`
			`circle.set_fill(WHITE, 0)`
			`circle.set_stroke(WHITE, 0)`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00
GetLostInNotation in nn/part3 2017-10-20 17:10:47 -07:00			`self.play(`
			`Write(equations),`
			`morty.change, "confused", equations`
			`)`
			`self.dither()`
			`self.play(morty.change, "pleading")`
			`self.dither(2)`

			`##`
			`movers = VGroup(*equations.family_members_with_points())`
			`random.shuffle(movers.submobjects)`
			`for mover in list(movers):`
			`if mover.is_subpath:`
			`movers.remove(mover)`
			`continue`
			`mover.set_stroke(WHITE, width = 0)`
			`mover.target = Circle()`
			`mover.target.scale(0.5)`
			`mover.target.set_fill(mover.get_color(), opacity = 0)`
			`mover.target.set_stroke(BLACK, width = 1)`
			`mover.target.move_to(mover)`
			`self.play(`
			`LaggedStart(`
			`MoveToTarget, movers,`
			`run_time = 2,`
			`),`
			`morty.change, "pondering",`
			`)`
			`self.dither()`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00
GetLostInNotation in nn/part3 2017-10-20 17:10:47 -07:00			`class TODOInsertPreviewLearning(TODOStub):`
			`CONFIG = {`
			`"message" : "Insert PreviewLearning"`
			`}`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`class ShowAveragingCost(PreviewLearning):`
			`CONFIG = {`
			`"network_scale_val" : 0.8,`
			`"stroke_width_exp" : 1,`
			`"start_examples_time" : 5,`
			`"examples_per_adjustment_time" : 2,`
			`"n_adjustments" : 5,`
			`"time_per_example" : 1./15,`
			`"image_height" : 1.2,`
			`}`
			`def construct(self):`
			`self.setup_network()`
			`self.setup_diff_words()`
			`self.show_many_examples()`

			`def setup_network(self):`
			`self.network_mob.scale(self.network_scale_val)`
			`self.network_mob.to_edge(DOWN)`
			`self.network_mob.shift(LEFT)`
			`self.color_network_edges()`

			`def setup_diff_words(self):`
			`last_layer_copy = self.network_mob.layers[-1].deepcopy()`
			`last_layer_copy.add(self.network_mob.output_labels.copy())`
			`last_layer_copy.shift(1.5*RIGHT)`

			`double_arrow = DoubleArrow(`
			`self.network_mob.output_labels,`
			`last_layer_copy,`
			`color = RED`
			`)`
			`brace = Brace(`
			`VGroup(self.network_mob.layers[-1], last_layer_copy),`
			`UP`
			`)`
			`cost_words = brace.get_text("Cost of \\\\ one example")`
			`cost_words.highlight(RED)`

			`self.add(last_layer_copy, double_arrow, brace, cost_words)`
			`self.set_variables_as_attrs(`
			`last_layer_copy, double_arrow, brace, cost_words`
			`)`
			`self.last_layer_copy = last_layer_copy`

			`def show_many_examples(self):`
			`training_data, validation_data, test_data = load_data_wrapper()`
			`training_data_iter = iter(training_data)`

			`average_words = TextMobject("Average over all training examples")`
			`average_words.next_to(LEFT, RIGHT)`
			`average_words.to_edge(UP)`
			`self.add(average_words)`

			`for x in xrange(int(self.start_examples_time/self.time_per_example)):`
			`train_in, train_out = training_data_iter.next()`
			`self.show_one_example(train_in, train_out)`
			`self.dither(self.time_per_example)`

			`#Wiggle all edges`
			`edges = VGroup(it.chain(self.network_mob.edge_groups))`
			`reversed_edges = VGroup(*reversed(edges))`
			`self.play(LaggedStart(`
			`ApplyFunction, edges,`
			`lambda edge : (`
			`lambda m : m.rotate_in_place(np.pi/12).highlight(YELLOW),`
			`edge,`
			`),`
			`rate_func = lambda t : wiggle(t, 4),`
			`run_time = 3,`
			`))`

			`#Show all, then adjust`
			`words = TextMobject(`
			`"Each step \\\\ uses every \\\\ example\\\\",`
			`"$\\dots$theoretically",`
			`alignment = ""`
			`)`
			`words.highlight(YELLOW)`
			`words.scale(0.8)`
			`words.to_corner(UP+LEFT)`

			`for x in xrange(self.n_adjustments):`
			`for y in xrange(int(self.examples_per_adjustment_time/self.time_per_example)):`
			`train_in, train_out = training_data_iter.next()`
			`self.show_one_example(train_in, train_out)`
			`self.dither(self.time_per_example)`
			`self.play(LaggedStart(`
			`ApplyMethod, reversed_edges,`
			`lambda m : (m.rotate_in_place, np.pi),`
			`run_time = 1,`
			`lag_ratio = 0.2,`
			`))`
			`if x < 2:`
			`self.play(FadeIn(words[x]))`
			`else:`
			`self.dither()`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`####`

			`def show_one_example(self, train_in, train_out):`
			`if hasattr(self, "curr_image"):`
			`self.remove(self.curr_image)`
			`image = MNistMobject(train_in)`
			`image.scale_to_fit_height(self.image_height)`
			`image.next_to(`
			`self.network_mob.layers[0].neurons, UP,`
			`aligned_edge = LEFT`
			`)`
			`self.add(image)`
			`self.network_mob.activate_layers(train_in)`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`index = np.argmax(train_out)`
			`self.last_layer_copy.neurons.set_fill(opacity = 0)`
			`self.last_layer_copy.neurons[index].set_fill(WHITE, opacity = 1)`
			`self.add(self.last_layer_copy)`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00
ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`self.curr_iamge = image`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00

ShowAveragingCost of nn/part3 2017-10-23 15:48:05 -07:00			`class WalkThroughTwoExample(ShowAveragingCost):`
			`def construct(self):`
			`self.force_skipping()`

			`self.setup_network()`
			`self.setup_diff_words()`
			`self.show_single_example()`
			`self.expand_last_layer()`
			`self.cannot_directly_affect_activations()`
			`self.show_desired_activation_nudges()`
			`self.focus_on_one_neuron()`
			`self.show_activation_formula()`
			`self.three_ways_to_increase()`
			`self.note_connections_to_brightest_neurons()`

			`def show_single_example(self):`
			`two_vect = get_organized_images()[2][0]`
			`two_out = np.zeroes(10)`
			`two_out[2] = 1.0`
			`self.show_one_example(two_vect, two_out)`
			`for layer in self.network_mob.layers:`
			`layer.neurons.set_fill(opacity = 0)`

			`self.revert_to_original_skipping_status()`
			`self.feed_forward(two_vect)`

			`def expand_last_layer(self):`
			`pass`

			`def cannot_directly_affect_activations(self):`
			`pass`

			`def show_desired_activation_nudges(self):`
			`pass`

			`def focus_on_one_neuron(self):`
			`pass`

			`def show_activation_formula(self):`
			`pass`

			`def three_ways_to_increase(self):`
			`pass`

			`def note_connections_to_brightest_neurons(self):`
			`pass`
Beginning backpropagation animations 2017-10-19 14:32:26 -07:00