.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    %matplotlib inline
    from mxnet import autograd, np, npx
    from d2l import mxnet as d2l

    npx.set_np()

    # Evaluate the sigmoid on a grid over [-8, 8) and differentiate w.r.t. x
    x = np.arange(-8.0, 8.0, 0.1)
    x.attach_grad()
    with autograd.record():
        # The forward pass is recorded so that backward() can populate x.grad
        y = npx.sigmoid(x)
    y.backward()

    # Plot the sigmoid and its gradient on the same axes
    d2l.plot(x, [y, x.grad], legend=['sigmoid', 'gradient'], figsize=(4.5, 2.5))

.. raw:: latex

   \diilbookstyleoutputcell

.. parsed-literal::
    :class: output

    [07:03:21] ../src/storage/storage.cc:196: Using Pooled (Naive) StorageManager for CPU
    [07:03:21] ../src/base.cc:48: GPU context requested, but no GPUs found.

.. figure:: output_numerical-stability-and-init_e60514_3_1.svg

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    %matplotlib inline
    import torch
    from d2l import torch as d2l

    # Evaluate the sigmoid on a grid over [-8, 8) and differentiate w.r.t. x
    x = torch.arange(-8.0, 8.0, 0.1, requires_grad=True)
    y = torch.sigmoid(x)
    # y is not a scalar, so backward() is given an explicit all-ones
    # upstream gradient of the same shape as x
    y.backward(torch.ones_like(x))

    # Tensors are detached and converted to NumPy before being plotted
    d2l.plot(x.detach().numpy(), [y.detach().numpy(), x.grad.numpy()],
             legend=['sigmoid', 'gradient'], figsize=(4.5, 2.5))

.. figure:: output_numerical-stability-and-init_e60514_6_0.svg

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    %matplotlib inline
    import tensorflow as tf
    from d2l import tensorflow as d2l

    # Evaluate the sigmoid on a grid over [-8, 8) and differentiate w.r.t. x
    x = tf.Variable(tf.range(-8.0, 8.0, 0.1))
    with tf.GradientTape() as t:
        # The forward pass runs under the tape so t.gradient(y, x) is available
        y = tf.nn.sigmoid(x)

    # Plot the sigmoid and its gradient on the same axes
    d2l.plot(x.numpy(), [y.numpy(), t.gradient(y, x).numpy()],
             legend=['sigmoid', 'gradient'], figsize=(4.5, 2.5))

.. figure:: output_numerical-stability-and-init_e60514_9_0.svg

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    %matplotlib inline
    import warnings
    from d2l import paddle as d2l

    # Warnings are silenced before paddle is imported
    warnings.filterwarnings("ignore")
    import paddle

    # Evaluate the sigmoid on a grid over [-8, 8) and differentiate w.r.t. x
    x = paddle.arange(start=-8.0, end=8.0, step=0.1, dtype='float32')
    x.stop_gradient = False
    y = paddle.nn.functional.sigmoid(x)
    # y is not a scalar, so backward() is given an explicit all-ones
    # upstream gradient of the same shape as x
    y.backward(paddle.ones_like(x))

    # Tensors are detached and converted to NumPy before being plotted
    d2l.plot(x.detach().numpy(), [y.detach().numpy(), x.grad.numpy()],
             legend=['sigmoid', 'gradient'], figsize=(4.5, 2.5))

.. figure:: output_numerical-stability-and-init_e60514_12_0.svg

.. raw:: html

.. raw:: html

mxnet pytorch tensorflow paddle

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Start from one random 4x4 Gaussian matrix ...
    M = np.random.normal(size=(4, 4))
    print('一个矩阵 \n', M)
    # ... and right-multiply it by 100 further random 4x4 Gaussian matrices
    for i in range(100):
        M = np.dot(M, np.random.normal(size=(4, 4)))

    print('乘以100个矩阵后\n', M)

.. raw:: latex

   \diilbookstyleoutputcell

.. parsed-literal::
    :class: output

    一个矩阵
     [[ 2.2122064 1.1630787 0.7740038 0.4838046 ]
     [ 1.0434403 0.29956347 1.1839255 0.15302546]
     [ 1.8917114 -1.1688148 -1.2347414 1.5580711 ]
     [-1.771029 -0.5459446 -0.45138445 -2.3556297 ]]
    乘以100个矩阵后
     [[ 3.4459747e+23 -7.8040759e+23 5.9973355e+23 4.5230040e+23]
     [ 2.5275059e+23 -5.7240258e+23 4.3988419e+23 3.3174704e+23]
     [ 1.3731275e+24 -3.1097129e+24 2.3897754e+24 1.8022945e+24]
     [-4.4951091e+23 1.0180045e+24 -7.8232368e+23 -5.9000419e+23]]

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Start from one random 4x4 standard-normal matrix ...
    M = torch.normal(0, 1, size=(4,4))
    print('一个矩阵 \n',M)
    # ... and right-multiply it by 100 further random 4x4 matrices
    for i in range(100):
        M = torch.mm(M,torch.normal(0, 1, size=(4, 4)))

    print('乘以100个矩阵后\n', M)

.. raw:: latex

   \diilbookstyleoutputcell

.. parsed-literal::
    :class: output

    一个矩阵
     tensor([[-0.7872, 2.7090, 0.5996, -1.3191],
            [-1.8260, -0.7130, -0.5521, 0.1051],
            [ 1.1213, 1.0472, -0.3991, -0.3802],
            [ 0.5552, 0.4517, -0.3218, 0.5214]])
    乘以100个矩阵后
     tensor([[-2.1897e+26, 8.8308e+26, 1.9813e+26, 1.7019e+26],
            [ 1.3110e+26, -5.2870e+26, -1.1862e+26, -1.0189e+26],
            [-1.6008e+26, 6.4559e+26, 1.4485e+26, 1.2442e+26],
            [ 3.0943e+25, -1.2479e+26, -2.7998e+25, -2.4050e+25]])

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Start from one random 4x4 Gaussian matrix ...
    M = tf.random.normal((4, 4))
    print('一个矩阵 \n', M)
    # ... and right-multiply it by 100 further random 4x4 Gaussian matrices
    for i in range(100):
        M = tf.matmul(M, tf.random.normal((4, 4)))

    print('乘以100个矩阵后\n', M.numpy())

.. raw:: latex

   \diilbookstyleoutputcell

.. parsed-literal::
    :class: output

    一个矩阵
     tf.Tensor(
    [[ 0.2560883 0.00797761 -1.0682204 -0.16417116]
     [ 2.0060067 0.3481633 -0.74592876 1.2011837 ]
     [ 0.21468055 0.09542773 -0.40310776 0.17152807]
     [-1.077096 -0.8505044 -2.3125033 -1.2070065 ]], shape=(4, 4), dtype=float32)
    乘以100个矩阵后
     [[-4.5526118e+23 1.2209238e+23 -5.6382419e+22 1.4789259e+23]
     [-2.1546440e+24 5.7783439e+23 -2.6684469e+23 6.9994081e+23]
     [-4.0427488e+23 1.0841861e+23 -5.0067922e+22 1.3132947e+23]
     [-1.7901018e+23 4.8007174e+22 -2.2169757e+22 5.8151884e+22]]

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Start from one random 4x4 standard-normal matrix ...
    M = paddle.normal(0, 1, shape=(4,4))
    print('一个矩阵 \n',M)
    # ... and right-multiply it by 100 further random 4x4 matrices
    for i in range(100):
        M = paddle.mm(M, paddle.normal(0, 1, shape=(4, 4)))

    print('乘以100个矩阵后\n', M)

.. raw:: latex

   \diilbookstyleoutputcell

.. parsed-literal::
    :class: output

    一个矩阵
     Tensor(shape=[4, 4], dtype=float32, place=Place(cpu), stop_gradient=True,
           [[ 0.09555759, 0.33683282, 1.20171154, 1.25189281],
            [-0.18284278, -0.65445828, 0.14309669, 0.55920464],
            [ 0.97072512, -0.47076491, -2.04063487, -0.57572478],
            [ 1.14641619, 1.06490767, 0.76046497, -0.27298930]])
    乘以100个矩阵后
     Tensor(shape=[4, 4], dtype=float32, place=Place(cpu), stop_gradient=True,
           [[-1939696468398394579091456., -2089295959956477146300416., 2721163381582732258705408., -3558180070471660887605248.],
            [-307949261019363894362112. , -331699912388626188599296. , 432016261022814285332480. , -564902317902972638461952. ],
            [ 2247077303087190278930432., 2420383743083751137083392., -3152382253269922833498112., 4122040255420859993292800.],
            [ 169666774892908099141632. , 182752361912601774391296. , -238022355993941958983680. , 311236780660953299550208. ]])

.. raw:: html

.. raw:: html