Iter #50: tensor([[ 0.1610,  0.0355],
        [ 0.1568,  0.1386],
        [-0.0111,  0.2204],
        [ 0.0130,  0.2152],
        [ 0.0978,  0.3584],
        [ 0.1450,  0.0306],
        [ 0.1529,  0.2523],
        [ 0.1032,  0.1583],
        [ 0.0816,  0.0105],
        [ 0.2732,  0.1838],
        [ 0.0863,  0.1492],
        [ 0.0606,  0.2493]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0007,  0.0239],
        [ 0.0046,  0.0351],
        [ 0.1405,  0.1652],
        [ 0.1003,  0.1037],
        [ 0.0964,  0.1106],
        [ 0.1712,  0.1200],
        [ 0.2066,  0.0615],
        [-0.2633,  0.3192],
        [ 0.1522,  0.3507],
        [ 0.0761,  0.1437],
        [ 0.0183,  0.1611],
        [ 0.1331,  0.3392]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.2056, -0.0165],
        [ 0.1736,  0.0124],
        [ 0.1896,  0.1476],
        [ 0.2663,  0.2542],
        [ 0.0994,  0.1105],
        [ 0.0915,  0.1320],
        [ 0.1555,  0.1930],
        [ 0.1847,  0.2362],
        [ 0.0605,  0.2365],
        [ 0.1457,  0.0292],
        [-0.0348,  0.1478],
        [ 0.1368,  0.2264]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0513,  0.2549],
        [ 0.0878,  0.3296],
        [ 0.1554,  0.3168],
        [ 0.1128,  0.1897],
        [-0.1224,  0.0817],
        [ 0.1639,  0.2228],
        [ 0.1270,  0.2118],
        [ 0.0960,  0.1063],
        [ 0.1945,  0.2078],
        [-0.0517,  0.2025],
        [ 0.1366,  0.1625],
        [ 0.0839,  0.1385]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0738,  0.2088],
        [ 0.0145,  0.1988],
        [ 0.1931,  0.1940],
        [ 0.0310,  0.2922],
        [ 0.2141,  0.2787],
        [-0.0368,  0.2268],
        [ 0.0230,  0.1782],
        [ 0.1575,  0.2249],
        [ 0.0149,  0.2145],
        [ 0.0988,  0.2367],
        [ 0.0427,  0.3253],
        [ 0.1315,  0.1350]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0109,  0.2274],
        [ 0.3018,  0.2088],
        [-0.0070,  0.2522],
        [ 0.1284,  0.2074],
        [ 0.3617,  0.1509],
        [ 0.3164,  0.0794],
        [ 0.2234,  0.0915],
        [ 0.1411,  0.2250],
        [ 0.0222,  0.2098],
        [-0.0432,  0.2414],
        [ 0.3267,  0.0049],
        [ 0.2156,  0.2453]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.1757,  0.3387],
        [ 0.0506,  0.2706],
        [ 0.2099,  0.2098],
        [-0.1822,  0.2380],
        [ 0.1277,  0.2154],
        [ 0.2024,  0.1476],
        [ 0.1612,  0.2413],
        [ 0.0367,  0.1368],
        [ 0.0647,  0.1849],
        [ 0.1882,  0.1199],
        [ 0.0911,  0.2069],
        [ 0.1236,  0.2230]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0597,  0.2334],
        [-0.0834,  0.2987],
        [ 0.1793,  0.2115],
        [-0.0274,  0.1542],
        [ 0.2060,  0.2327],
        [ 0.0347,  0.2550],
        [ 0.0621,  0.2707],
        [-0.0378,  0.2598],
        [ 0.0127,  0.2521],
        [ 0.0248,  0.1635],
        [ 0.0434,  0.2838],
        [-0.0313,  0.2852]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.1251,  0.2809],
        [-0.0774,  0.0709],
        [ 0.0529,  0.1138],
        [ 0.0682,  0.1695],
        [ 0.0160,  0.0889],
        [ 0.1189,  0.1612],
        [-0.0154,  0.1999],
        [ 0.1600,  0.1909],
        [ 0.0886,  0.3053],
        [-0.0406,  0.2299],
        [ 0.0856,  0.1508],
        [ 0.0593,  0.0509]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0648,  0.2800],
        [-0.1207,  0.0929],
        [ 0.1672,  0.1526],
        [-0.0422,  0.3465],
        [ 0.0900,  0.1354],
        [ 0.1443,  0.3290],
        [ 0.0268,  0.0902],
        [ 0.1827,  0.2649],
        [-0.0550,  0.2873],
        [ 0.1470,  0.2917],
        [ 0.0291,  0.1682],
        [-0.1120,  0.6097]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0670,  0.2026],
        [ 0.1297,  0.1729],
        [ 0.0941,  0.1555],
        [ 0.0541,  0.3270],
        [ 0.1179,  0.2428],
        [ 0.2101,  0.2162],
        [-0.0038,  0.3376],
        [ 0.0873,  0.1719],
        [-0.1486,  0.1566],
        [ 0.3334,  0.1954],
        [ 0.1846,  0.1801],
        [ 0.1754,  0.3118]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0180,  0.2752],
        [-0.1948,  0.3589],
        [ 0.0827,  0.2173],
        [ 0.0843,  0.2704],
        [ 0.0708,  0.2113],
        [ 0.1898,  0.2403],
        [ 0.1212,  0.2119],
        [ 0.0854,  0.1725],
        [-0.1439,  0.3158],
        [ 0.0265,  0.2007],
        [ 0.1563,  0.1926],
        [ 0.1318,  0.2950]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0040,  0.4523],
        [ 0.1359,  0.2737],
        [-0.0439,  0.2297],
        [ 0.0208,  0.2147],
        [ 0.0412,  0.0100],
        [ 0.1370,  0.1680],
        [ 0.1025,  0.2359],
        [-0.0326,  0.2153],
        [ 0.1278,  0.3058],
        [-0.0319,  0.2837],
        [-0.0994,  0.4090],
        [ 0.0825,  0.1542]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 2.0197e-02,  2.8402e-01],
        [-2.0242e-04, -6.4354e-03],
        [ 9.8609e-02,  9.0170e-02],
        [ 1.1278e-01,  4.0510e-01],
        [ 2.2630e-01,  1.7128e-01],
        [ 5.6523e-02,  1.6791e-01],
        [ 1.2019e-01,  1.1951e-01],
        [ 1.4132e-01,  2.5156e-01],
        [ 1.9712e-01,  2.6665e-01],
        [ 2.3351e-01,  2.7398e-02],
        [ 2.8919e-04,  1.9984e-01],
        [-1.0822e-01,  1.9158e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1454,  0.2257],
        [ 0.1711,  0.3376],
        [ 0.0937,  0.3097],
        [ 0.1719,  0.1506],
        [-0.1727,  0.3010],
        [ 0.2394,  0.1726],
        [-0.0865,  0.1408],
        [ 0.1909,  0.0962],
        [ 0.1842,  0.1830],
        [ 0.1034,  0.2084],
        [ 0.1798,  0.2312],
        [ 0.0140,  0.2615]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.1488,  0.2225],
        [ 0.0831,  0.1105],
        [ 0.0161,  0.1911],
        [ 0.0693,  0.1879],
        [ 0.2034,  0.1252],
        [ 0.2477,  0.1593],
        [ 0.1464,  0.0836],
        [-0.0942,  0.3141],
        [-0.0788,  0.2847],
        [ 0.0206,  0.2943],
        [ 0.1902,  0.2477],
        [-0.0835,  0.2666]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[ 0.1020,  0.2645],
        [ 0.3033,  0.2552],
        [ 0.0838,  0.2518],
        [ 0.0611,  0.1457],
        [ 0.3244,  0.2161],
        [ 0.1083,  0.1732],
        [-0.0822,  0.2984],
        [ 0.1162,  0.1813],
        [-0.0456,  0.1319],
        [ 0.0923,  0.1922],
        [ 0.1161,  0.1581],
        [-0.0419,  0.2650]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.2127,  0.2517],
        [ 0.2116,  0.2358],
        [-0.0016,  0.2196],
        [-0.3020,  0.2775],
        [ 0.0393,  0.1239],
        [ 0.2012,  0.1040],
        [ 0.0522,  0.0790],
        [-0.0996,  0.3222],
        [ 0.0537,  0.1670],
        [ 0.0905,  0.1628],
        [ 0.1105,  0.0528],
        [ 0.1397,  0.1739]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 9.0261e-02,  2.3689e-01],
        [ 2.9976e-02,  8.8643e-02],
        [ 1.2996e-01,  1.8186e-01],
        [ 1.8175e-04,  3.0984e-01],
        [ 2.6155e-02,  2.7758e-01],
        [-1.6259e-01,  1.9606e-01],
        [-4.1224e-03,  1.4904e-01],
        [ 1.5052e-01,  2.1940e-01],
        [ 9.5537e-02,  1.6721e-01],
        [-9.6815e-02,  3.5912e-01],
        [ 1.7735e-01,  2.2410e-01],
        [-1.6470e-01,  4.3903e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0880,  0.2500],
        [-0.2424,  0.3107],
        [-0.1402,  0.2531],
        [-0.1159,  0.1584],
        [-0.0882,  0.1814],
        [-0.0404,  0.2095],
        [-0.2449,  0.2500],
        [ 0.1948,  0.2377],
        [-0.0445,  0.1494],
        [ 0.0114,  0.2971],
        [ 0.1775,  0.1732],
        [-0.0956,  0.1983]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0139,  0.1925],
        [ 0.1657,  0.2312],
        [ 0.0927,  0.0752],
        [ 0.0460,  0.4155],
        [ 0.1664,  0.2148],
        [ 0.0744,  0.2956],
        [-0.0338,  0.1947],
        [ 0.1997,  0.1289],
        [ 0.0475,  0.2058],
        [ 0.1008,  0.2061],
        [ 0.1091,  0.3393],
        [ 0.0597,  0.4580]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0705,  0.2052],
        [-0.0314,  0.3214],
        [-0.0340,  0.3248],
        [-0.1135,  0.1715],
        [ 0.0482,  0.2201],
        [ 0.1819,  0.2737],
        [-0.1551,  0.2189],
        [-0.0889,  0.1450],
        [-0.1618,  0.2721],
        [ 0.1348,  0.2624],
        [ 0.1803,  0.1905],
        [ 0.1741,  0.3486]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.1144,  0.3868],
        [-0.1072,  0.1104],
        [-0.1294,  0.2379],
        [ 0.0738,  0.3310],
        [ 0.0553,  0.4730],
        [-0.0225,  0.1598],
        [-0.0483,  0.2677],
        [-0.0091,  0.2664],
        [-0.2152,  0.2412],
        [-0.3224,  0.3620],
        [ 0.0832,  0.0723],
        [ 0.0247,  0.2932]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2041,  0.4849],
        [-0.2782,  0.2659],
        [ 0.1131,  0.2978],
        [-0.0192,  0.2514],
        [ 0.0952,  0.1545],
        [ 0.0823,  0.2671],
        [-0.2161,  0.2942],
        [-0.1023,  0.0987],
        [ 0.0287,  0.3837],
        [-0.0818,  0.3276],
        [-0.1326,  0.4007],
        [-0.0817,  0.3914]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.1765,  0.1710],
        [-0.0343,  0.0927],
        [-0.1468,  0.2306],
        [-0.1676,  0.2234],
        [-0.1191,  0.3185],
        [ 0.0101,  0.3264],
        [-0.0668,  0.1279],
        [ 0.0730,  0.2767],
        [ 0.0091,  0.4115],
        [ 0.0217,  0.2011],
        [-0.1276,  0.3547],
        [ 0.0080,  0.1645]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.1137,  0.4170],
        [ 0.0861,  0.3384],
        [-0.0568,  0.5465],
        [-0.0568,  0.2251],
        [-0.1249,  0.2136],
        [ 0.0529,  0.2396],
        [-0.1364,  0.3991],
        [-0.0187,  0.2428],
        [ 0.1421,  0.2644],
        [ 0.0099,  0.3240],
        [-0.0022,  0.1694],
        [-0.0298,  0.2497]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0476,  0.2594],
        [-0.0454,  0.1917],
        [ 0.1219,  0.2548],
        [ 0.0213,  0.2574],
        [ 0.1369,  0.1809],
        [ 0.1319,  0.2079],
        [-0.1140,  0.3079],
        [ 0.0039,  0.2078],
        [ 0.0150,  0.1652],
        [-0.1018,  0.1621],
        [-0.0140,  0.2911],
        [ 0.0260,  0.3107]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1272,  0.1374],
        [ 0.1139,  0.2744],
        [-0.0144,  0.4022],
        [ 0.0445,  0.3945],
        [ 0.0935,  0.3229],
        [ 0.1668,  0.0727],
        [ 0.0030,  0.0801],
        [-0.0025,  0.3539],
        [-0.1183,  0.2906],
        [ 0.0396,  0.2127],
        [ 0.0364,  0.1808],
        [-0.1452,  0.2108]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0079,  0.2741],
        [ 0.0925,  0.2029],
        [-0.0039,  0.3035],
        [-0.1601,  0.2374],
        [-0.1639,  0.2349],
        [ 0.0952,  0.1700],
        [ 0.0285,  0.2337],
        [-0.1621,  0.2173],
        [-0.2065,  0.2771],
        [-0.0133,  0.3641],
        [-0.0544,  0.2008],
        [-0.0945,  0.2089]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0837,  0.2222],
        [-0.1111,  0.2758],
        [-0.0714,  0.3660],
        [-0.0883,  0.3004],
        [-0.0291,  0.2873],
        [-0.2426,  0.1564],
        [-0.0426,  0.1563],
        [ 0.0916,  0.2646],
        [-0.0249,  0.3278],
        [-0.1459,  0.3207],
        [ 0.0312,  0.2492],
        [-0.0646,  0.2858]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0067,  0.3745],
        [-0.0484,  0.1936],
        [-0.1078,  0.1774],
        [ 0.0648,  0.2410],
        [ 0.0537,  0.2347],
        [-0.0283,  0.1837],
        [-0.0379,  0.2295],
        [ 0.1007,  0.1871],
        [-0.0754,  0.1748],
        [-0.0558,  0.3488],
        [ 0.0557,  0.1188],
        [-0.1040,  0.3053]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 4.8632e-03,  1.5706e-01],
        [ 7.7249e-02,  1.7258e-01],
        [ 1.4868e-01,  7.3946e-02],
        [ 3.3306e-02,  2.1337e-01],
        [-1.9428e-02,  4.5792e-01],
        [-1.3553e-02,  2.3544e-01],
        [-1.4935e-01,  2.1085e-01],
        [-1.6696e-03,  3.8474e-01],
        [-2.0728e-03,  3.1762e-01],
        [ 3.6955e-04,  1.9798e-01],
        [ 2.4919e-01,  3.0328e-01],
        [ 1.4717e-01,  3.6464e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1314,  0.2563],
        [-0.0156,  0.0966],
        [ 0.1043,  0.1928],
        [-0.0080,  0.2129],
        [-0.0757,  0.2669],
        [ 0.0487,  0.2450],
        [-0.0238,  0.2754],
        [-0.0189,  0.2608],
        [-0.1087,  0.1164],
        [-0.0283,  0.2108],
        [ 0.0545,  0.3394],
        [ 0.1330,  0.2027]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.0325,  0.2915],
        [-0.1548,  0.2674],
        [-0.1501,  0.1890],
        [-0.0667,  0.2554],
        [-0.0160,  0.2968],
        [ 0.0881,  0.2756],
        [-0.1296,  0.3025],
        [-0.0400,  0.3063],
        [ 0.0413,  0.2768],
        [ 0.0497,  0.2576],
        [-0.0201,  0.2449],
        [ 0.0473,  0.4364]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2119,  0.3465],
        [-0.1499,  0.2067],
        [ 0.0516,  0.2780],
        [-0.0347,  0.2246],
        [-0.0445,  0.2207],
        [-0.0014,  0.3139],
        [-0.0164,  0.1992],
        [-0.2108,  0.1959],
        [ 0.0736,  0.3588],
        [-0.0131,  0.1373],
        [-0.0429,  0.3371],
        [ 0.0479,  0.3603]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.0733,  0.1382],
        [-0.0293,  0.1726],
        [-0.0863,  0.1444],
        [-0.1050,  0.4251],
        [ 0.0735,  0.2698],
        [ 0.0869,  0.3038],
        [-0.1070,  0.3070],
        [ 0.0114,  0.2180],
        [ 0.0174,  0.2557],
        [ 0.1277,  0.1429],
        [-0.1643,  0.2310],
        [-0.0022,  0.0449]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0102,  0.2873],
        [ 0.0550,  0.2543],
        [-0.0796,  0.2182],
        [ 0.0532,  0.2348],
        [ 0.0042,  0.2163],
        [-0.0277,  0.3454],
        [-0.0204,  0.2923],
        [ 0.1123,  0.1753],
        [ 0.1395,  0.1289],
        [-0.1419,  0.1363],
        [ 0.0054,  0.1743],
        [ 0.0416,  0.3367]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.1111,  0.1678],
        [-0.0451,  0.3020],
        [ 0.2355,  0.2044],
        [-0.0403,  0.2377],
        [ 0.1537,  0.3793],
        [ 0.0110,  0.1382],
        [ 0.0163,  0.2864],
        [-0.1155,  0.3017],
        [-0.1885,  0.3350],
        [ 0.1031,  0.1744],
        [ 0.0441,  0.2762],
        [ 0.0142,  0.2321]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1670,  0.3201],
        [ 0.0281,  0.2839],
        [-0.0120,  0.2658],
        [ 0.0938,  0.2774],
        [ 0.3368,  0.2187],
        [ 0.2737,  0.0795],
        [-0.0963,  0.2081],
        [-0.0693,  0.3582],
        [-0.0085,  0.3065],
        [ 0.0231,  0.3547],
        [ 0.0127,  0.2157],
        [-0.0421,  0.3516]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 1.8822e-01,  1.8981e-01],
        [ 8.1732e-02,  2.8641e-01],
        [ 7.5922e-02,  1.9041e-01],
        [-1.8142e-04,  8.7950e-02],
        [ 7.2758e-02,  2.1907e-01],
        [ 1.3845e-01,  1.3781e-01],
        [ 1.2447e-02,  3.2366e-01],
        [-9.3073e-02,  8.3170e-02],
        [-1.2597e-01,  2.0090e-01],
        [-1.6057e-03,  4.2874e-01],
        [ 5.0045e-02,  1.7681e-01],
        [-3.3239e-02,  2.7515e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0450,  0.2367],
        [-0.0260,  0.3024],
        [-0.0060,  0.1839],
        [-0.0565,  0.2777],
        [ 0.0455,  0.2240],
        [-0.1094,  0.2272],
        [-0.0214,  0.2431],
        [ 0.0354,  0.2215],
        [ 0.0926,  0.2879],
        [ 0.1205,  0.2269],
        [ 0.0831,  0.2876],
        [ 0.0610,  0.2563]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.2035,  0.3430],
        [-0.0537,  0.2997],
        [-0.0682,  0.2761],
        [ 0.0669,  0.2450],
        [-0.0354,  0.1580],
        [-0.0660,  0.1370],
        [-0.4328,  0.1761],
        [-0.0434,  0.1160],
        [ 0.0432,  0.1734],
        [ 0.0707,  0.1547],
        [ 0.1117,  0.2059],
        [-0.0159,  0.2633]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0430,  0.2085],
        [ 0.0085,  0.2365],
        [ 0.0592,  0.2117],
        [ 0.0661,  0.0734],
        [ 0.0157,  0.3014],
        [-0.0942,  0.3853],
        [-0.1107,  0.1137],
        [ 0.1031,  0.2580],
        [-0.0085,  0.1062],
        [ 0.0192,  0.1735],
        [-0.0172,  0.2098],
        [ 0.0077,  0.2461]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.2398,  0.3753],
        [-0.1169,  0.1951],
        [-0.2245,  0.3410],
        [-0.0006,  0.3033],
        [ 0.0335,  0.3322],
        [ 0.0491,  0.2943],
        [-0.1892,  0.3432],
        [ 0.0489,  0.3856],
        [-0.2028,  0.1540],
        [ 0.0566,  0.0460],
        [ 0.1571,  0.1959],
        [-0.0416,  0.1709]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0041,  0.1120],
        [-0.1537,  0.2803],
        [ 0.0372,  0.1641],
        [ 0.1267,  0.2732],
        [ 0.1703,  0.1122],
        [ 0.0189,  0.2478],
        [ 0.0335,  0.3498],
        [ 0.0766,  0.1908],
        [-0.2095,  0.0386],
        [-0.0934,  0.1763],
        [-0.0930,  0.1844],
        [ 0.0202,  0.3063]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0038,  0.2217],
        [-0.2308,  0.0060],
        [ 0.0723,  0.1671],
        [-0.0390,  0.1420],
        [-0.0478,  0.1781],
        [-0.0055,  0.1500],
        [ 0.0399,  0.2348],
        [ 0.0750,  0.1449],
        [ 0.2034,  0.2336],
        [ 0.0224,  0.1279],
        [ 0.0960,  0.2959],
        [ 0.0734,  0.1745]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.0195,  0.2998],
        [-0.1638, -0.1160],
        [-0.2119,  0.2042],
        [-0.0584,  0.3151],
        [ 0.1117,  0.2518],
        [ 0.1541,  0.1259],
        [ 0.0276,  0.1259],
        [ 0.1340,  0.1870],
        [ 0.0927,  0.1698],
        [ 0.1768,  0.1077],
        [-0.0608,  0.2038],
        [ 0.0627,  0.1242]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.0332,  0.0636],
        [ 0.1090,  0.1457],
        [ 0.1041,  0.0971],
        [ 0.0311,  0.2363],
        [-0.0444,  0.1564],
        [ 0.1310,  0.1425],
        [-0.1900,  0.2194],
        [-0.0243,  0.0647],
        [ 0.0762,  0.2664],
        [-0.0924,  0.1516],
        [-0.1215,  0.0380],
        [ 0.0048,  0.1748]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.2066,  0.0248],
        [ 0.0592,  0.1930],
        [ 0.0434,  0.2748],
        [ 0.0140,  0.1426],
        [ 0.1040,  0.2815],
        [ 0.1113,  0.1314],
        [ 0.0825,  0.0355],
        [-0.1947,  0.1689],
        [ 0.0624,  0.2171],
        [ 0.0719,  0.1430],
        [ 0.1023,  0.0641],
        [ 0.1573,  0.1276]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0645,  0.1284],
        [ 0.0344,  0.0839],
        [ 0.1113,  0.2462],
        [ 0.0968,  0.1958],
        [ 0.2168,  0.1631],
        [ 0.2082,  0.0480],
        [-0.1136,  0.0520],
        [ 0.1297,  0.1873],
        [ 0.0049,  0.0440],
        [ 0.0335,  0.1109],
        [ 0.0058,  0.1638],
        [-0.0823,  0.3601]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.1773,  0.1263],
        [-0.0506,  0.2621],
        [-0.1583,  0.3033],
        [-0.2958,  0.1222],
        [-0.1118,  0.2079],
        [ 0.1576,  0.0790],
        [-0.0876,  0.2757],
        [-0.1445,  0.0489],
        [-0.0501,  0.3100],
        [ 0.0978,  0.3347],
        [-0.0477,  0.2120],
        [ 0.0735,  0.1274]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0589,  0.2110],
        [-0.0106,  0.1950],
        [-0.0565,  0.3033],
        [-0.0601,  0.2013],
        [-0.0135,  0.2939],
        [-0.1008,  0.1167],
        [ 0.1700,  0.1520],
        [-0.0661,  0.1062],
        [ 0.0006,  0.2006],
        [ 0.0510,  0.2356],
        [ 0.0004,  0.3575],
        [-0.2739, -0.0199]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0656,  0.2240],
        [ 0.0944,  0.1811],
        [-0.0405,  0.2610],
        [-0.0752,  0.0720],
        [ 0.0959,  0.1798],
        [ 0.0108,  0.1207],
        [-0.1391,  0.1362],
        [ 0.1448,  0.1658],
        [-0.0935,  0.0285],
        [ 0.0095,  0.1724],
        [ 0.1101,  0.1394],
        [-0.0934,  0.3097]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0258,  0.1763],
        [ 0.0729,  0.1110],
        [ 0.1641,  0.0883],
        [-0.0100,  0.1848],
        [ 0.0022,  0.3220],
        [ 0.0885,  0.0773],
        [-0.1945,  0.2322],
        [ 0.1329,  0.2574],
        [-0.0725,  0.3963],
        [-0.1834,  0.2763],
        [ 0.0239,  0.1903],
        [ 0.0147,  0.2953]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0570,  0.1092],
        [ 0.0552,  0.1573],
        [-0.1710,  0.2121],
        [ 0.0536,  0.1494],
        [ 0.0914,  0.2231],
        [-0.0392,  0.2524],
        [-0.1172,  0.0963],
        [-0.0530,  0.2234],
        [-0.0893, -0.0977],
        [ 0.1054,  0.0612],
        [ 0.0197,  0.2141],
        [ 0.1582, -0.0238]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0901,  0.2091],
        [-0.3488,  0.2392],
        [-0.2854,  0.1262],
        [ 0.0344,  0.1506],
        [ 0.0529,  0.1042],
        [ 0.0703,  0.1200],
        [ 0.0779,  0.1144],
        [-0.0537, -0.0371],
        [-0.1262,  0.0510],
        [-0.0480,  0.2478],
        [ 0.0403,  0.1975],
        [ 0.0314,  0.2614]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2156,  0.3095],
        [-0.2499,  0.0850],
        [ 0.1384,  0.0712],
        [ 0.0413,  0.2566],
        [ 0.0167,  0.1526],
        [ 0.1442,  0.2404],
        [-0.1016,  0.1554],
        [ 0.0185,  0.1043],
        [ 0.0083,  0.1636],
        [ 0.0816,  0.1397],
        [-0.1806,  0.0513],
        [ 0.0948,  0.3137]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.0463,  0.0697],
        [-0.1065, -0.0695],
        [-0.1623,  0.1697],
        [-0.0252,  0.2761],
        [ 0.0193,  0.2589],
        [ 0.2595, -0.0536],
        [-0.1066,  0.1762],
        [ 0.0632,  0.1754],
        [ 0.1060,  0.2319],
        [ 0.1823,  0.1825],
        [-0.1524,  0.3117],
        [-0.0350,  0.0901]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0247,  0.2102],
        [ 0.0534,  0.2353],
        [ 0.0884,  0.1202],
        [ 0.0405,  0.2438],
        [-0.0183,  0.0041],
        [ 0.1386,  0.2581],
        [-0.0062,  0.3322],
        [ 0.0318,  0.1653],
        [ 0.1472,  0.2385],
        [-0.1331,  0.1604],
        [-0.2140,  0.0603],
        [ 0.1266,  0.1638]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0788,  0.1824],
        [ 0.0571,  0.2411],
        [ 0.0257,  0.1032],
        [-0.0791,  0.2823],
        [ 0.1028,  0.1952],
        [ 0.0842,  0.2599],
        [-0.0809,  0.2050],
        [-0.1799,  0.2593],
        [-0.0612,  0.2745],
        [ 0.0871,  0.2610],
        [-0.0652,  0.2330],
        [ 0.1468,  0.2231]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[ 0.0224,  0.2144],
        [-0.0858,  0.1927],
        [ 0.0427,  0.2297],
        [-0.0176,  0.1917],
        [ 0.0515,  0.1868],
        [ 0.1134,  0.1451],
        [-0.1522,  0.2071],
        [ 0.0232,  0.2064],
        [-0.0474,  0.2399],
        [-0.1159,  0.1963],
        [-0.0640,  0.1909],
        [-0.1781,  0.2352]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0281,  0.3039],
        [-0.0103,  0.1231],
        [ 0.0739,  0.1852],
        [ 0.0076,  0.1739],
        [-0.0429,  0.1915],
        [-0.0072,  0.0079],
        [-0.0380,  0.2983],
        [-0.0108, -0.0598],
        [-0.0617,  0.2105],
        [-0.0043,  0.3664],
        [-0.1248,  0.0956],
        [ 0.0837,  0.1515]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0241,  0.3100],
        [ 0.0716,  0.0670],
        [ 0.1602,  0.0243],
        [-0.0234,  0.1158],
        [ 0.1269,  0.1650],
        [ 0.1514, -0.0323],
        [-0.0783,  0.2432],
        [-0.0094,  0.3020],
        [ 0.0005,  0.1960],
        [-0.0007,  0.2788],
        [ 0.0253,  0.3189],
        [ 0.1265,  0.2176]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0073,  0.2381],
        [-0.0905,  0.2375],
        [-0.0897,  0.2756],
        [ 0.0355,  0.3025],
        [ 0.0336,  0.1788],
        [-0.0150,  0.2739],
        [ 0.0773,  0.2371],
        [-0.0241,  0.1283],
        [-0.1323,  0.2208],
        [ 0.0114,  0.1439],
        [ 0.0045,  0.1824],
        [ 0.0217,  0.3089]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0651,  0.3672],
        [-0.0247,  0.1865],
        [ 0.2419,  0.1371],
        [-0.0913,  0.1819],
        [-0.0668,  0.4095],
        [ 0.1673,  0.0784],
        [-0.1384,  0.1349],
        [ 0.1282,  0.2358],
        [-0.0205,  0.3012],
        [-0.0983,  0.1363],
        [-0.0656,  0.2833],
        [-0.1073,  0.2496]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0853,  0.1562],
        [-0.0715,  0.2160],
        [ 0.0149,  0.0769],
        [ 0.0657,  0.0890],
        [-0.0554,  0.2702],
        [-0.0251,  0.2563],
        [ 0.0182,  0.1644],
        [-0.1146,  0.2754],
        [ 0.0531,  0.1379],
        [-0.0275,  0.1916],
        [ 0.0503,  0.2633],
        [ 0.0908,  0.1176]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0593,  0.2357],
        [-0.0817,  0.1861],
        [-0.0422,  0.2556],
        [-0.1540,  0.1204],
        [ 0.2868,  0.1082],
        [ 0.0121,  0.2841],
        [-0.1067,  0.3118],
        [ 0.0660,  0.2268],
        [ 0.0061,  0.2012],
        [ 0.1697,  0.1934],
        [ 0.0561,  0.1809],
        [ 0.0382,  0.2756]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2691,  0.2543],
        [-0.0057,  0.1041],
        [ 0.0940,  0.2946],
        [ 0.0496,  0.1507],
        [-0.1329,  0.4062],
        [ 0.0283,  0.2784],
        [-0.2043,  0.3094],
        [-0.0332,  0.3086],
        [ 0.1503,  0.2117],
        [ 0.1760,  0.1790],
        [-0.0246,  0.2270],
        [ 0.0519,  0.2455]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.1010,  0.2435],
        [-0.0071,  0.1341],
        [-0.0919,  0.2003],
        [-0.1319,  0.2839],
        [ 0.2005,  0.2293],
        [ 0.1388,  0.0925],
        [-0.0621,  0.2576],
        [ 0.1345,  0.2565],
        [ 0.1003,  0.1271],
        [ 0.1266,  0.0879],
        [-0.2737,  0.2392],
        [-0.0839,  0.3180]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.0624,  0.2075],
        [ 0.1687,  0.1282],
        [ 0.0696,  0.3544],
        [ 0.0331,  0.1773],
        [ 0.1455,  0.1064],
        [ 0.1136,  0.3258],
        [-0.2081,  0.1768],
        [-0.0101,  0.0663],
        [ 0.0710,  0.2128],
        [ 0.0071,  0.2640],
        [ 0.1686,  0.1747],
        [ 0.0463,  0.1516]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0455,  0.2214],
        [-0.0860,  0.1598],
        [-0.0011,  0.2753],
        [-0.1316,  0.2791],
        [ 0.0005,  0.3217],
        [-0.0045,  0.2915],
        [-0.0459,  0.1737],
        [-0.1774,  0.1035],
        [ 0.0343,  0.1997],
        [ 0.0733,  0.1715],
        [ 0.0597,  0.1965],
        [ 0.1187,  0.1169]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0739,  0.1702],
        [ 0.0645,  0.2061],
        [-0.1080,  0.2912],
        [ 0.1859,  0.1946],
        [ 0.1675,  0.2777],
        [ 0.2067,  0.1714],
        [-0.0085,  0.1944],
        [ 0.0596,  0.2748],
        [ 0.0085,  0.1647],
        [ 0.0943,  0.1955],
        [-0.0178,  0.2227],
        [-0.0859,  0.3163]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0282,  0.2243],
        [ 0.0797,  0.0781],
        [-0.0867,  0.2003],
        [ 0.0941,  0.1612],
        [ 0.0499,  0.3163],
        [ 0.0197,  0.0966],
        [ 0.0912,  0.3975],
        [ 0.0917,  0.1203],
        [-0.0552,  0.3105],
        [ 0.0806,  0.2901],
        [-0.0769,  0.1383],
        [-0.0367,  0.3873]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0706,  0.2418],
        [-0.1597,  0.2330],
        [ 0.0027,  0.1450],
        [-0.0265,  0.2525],
        [ 0.1014,  0.2126],
        [ 0.0747, -0.0009],
        [ 0.0204,  0.1422],
        [-0.1461,  0.3655],
        [ 0.0867,  0.3057],
        [ 0.0131,  0.2181],
        [-0.1625,  0.3228],
        [-0.0034,  0.1602]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0833,  0.1854],
        [-0.2220,  0.2378],
        [-0.1129,  0.2482],
        [-0.0235,  0.3255],
        [-0.1514,  0.1336],
        [ 0.0099,  0.1201],
        [-0.0651,  0.0695],
        [ 0.0541,  0.1054],
        [ 0.1490,  0.1803],
        [-0.0785,  0.2906],
        [ 0.0053,  0.3050],
        [-0.1279,  0.3952]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0137,  0.2008],
        [-0.0292,  0.0785],
        [ 0.2372,  0.1876],
        [ 0.0299,  0.2506],
        [-0.2007,  0.2932],
        [ 0.0307,  0.1427],
        [-0.0027,  0.2321],
        [-0.0067,  0.2927],
        [ 0.0134,  0.1232],
        [ 0.1001,  0.2512],
        [-0.0709,  0.1942],
        [-0.0067,  0.1846]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1141,  0.1005],
        [ 0.0155,  0.1597],
        [ 0.0058,  0.2634],
        [ 0.0444,  0.2256],
        [-0.0890,  0.2303],
        [ 0.0714,  0.2117],
        [-0.2052,  0.3095],
        [ 0.0585,  0.2711],
        [-0.0470,  0.1424],
        [ 0.1292,  0.0872],
        [ 0.1135,  0.0736],
        [ 0.2000,  0.1739]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0138,  0.2489],
        [-0.0380,  0.3109],
        [-0.1089,  0.3100],
        [ 0.0808,  0.3112],
        [ 0.1516,  0.2042],
        [ 0.0513,  0.2297],
        [-0.1038,  0.3226],
        [-0.0309,  0.1587],
        [-0.1324,  0.0587],
        [-0.0106,  0.1022],
        [-0.0524,  0.1829],
        [ 0.0666,  0.2550]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0576,  0.1536],
        [ 0.0011,  0.0406],
        [ 0.0812,  0.1173],
        [ 0.0601,  0.1816],
        [-0.0456,  0.0607],
        [ 0.0432,  0.1623],
        [-0.1158,  0.1778],
        [ 0.1283,  0.1160],
        [ 0.1002,  0.1153],
        [ 0.0675,  0.1847],
        [-0.1047,  0.1849],
        [ 0.1611,  0.2550]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.1531,  0.1755],
        [-0.0628,  0.0325],
        [-0.0748,  0.2171],
        [-0.2360,  0.4695],
        [ 0.0249,  0.2002],
        [ 0.0743,  0.1169],
        [ 0.0658,  0.1428],
        [ 0.1730,  0.0440],
        [ 0.0904,  0.1212],
        [ 0.1184,  0.2422],
        [-0.1121,  0.3098],
        [ 0.0823,  0.2131]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-6.8271e-02,  2.4695e-01],
        [-1.2773e-04,  2.9850e-01],
        [ 4.9710e-02,  2.5094e-01],
        [ 1.3903e-01,  2.3111e-01],
        [ 2.3868e-01, -4.4995e-03],
        [ 1.4525e-02,  3.5069e-01],
        [-1.4407e-01,  1.6393e-01],
        [ 1.4072e-01,  4.7786e-02],
        [ 1.4091e-01,  1.3365e-01],
        [ 1.4424e-02,  7.6798e-02],
        [-4.3171e-04,  1.5804e-01],
        [ 8.0534e-02,  1.7919e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0992,  0.0686],
        [ 0.0003,  0.2125],
        [ 0.0035,  0.3054],
        [ 0.0363,  0.1878],
        [ 0.0263,  0.2932],
        [ 0.0296,  0.1970],
        [-0.0926,  0.2899],
        [-0.1169,  0.1898],
        [ 0.0026,  0.1821],
        [ 0.0072,  0.2170],
        [ 0.0374,  0.2867],
        [ 0.2783,  0.1289]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[ 0.0249,  0.0185],
        [ 0.1083,  0.1520],
        [-0.1296,  0.3167],
        [ 0.1339,  0.0167],
        [ 0.1768,  0.2456],
        [ 0.2327,  0.1312],
        [-0.2011,  0.2431],
        [ 0.0930,  0.1762],
        [ 0.0571,  0.1369],
        [ 0.1253,  0.2445],
        [ 0.0912,  0.2259],
        [ 0.0529,  0.0005]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0555,  0.2940],
        [ 0.1552,  0.1372],
        [ 0.0071,  0.0849],
        [ 0.0181,  0.3410],
        [-0.0106,  0.3541],
        [ 0.2385,  0.0700],
        [-0.1239,  0.3972],
        [ 0.1241,  0.0346],
        [-0.1002,  0.1617],
        [-0.0940,  0.4274],
        [-0.1856,  0.3224],
        [ 0.1253,  0.1401]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0089,  0.1330],
        [-0.0733,  0.2688],
        [ 0.0164,  0.1233],
        [ 0.1651,  0.0762],
        [ 0.0386,  0.1733],
        [ 0.1079,  0.0710],
        [ 0.0634,  0.0963],
        [-0.2274,  0.1686],
        [ 0.1780,  0.2656],
        [ 0.0857,  0.1489],
        [ 0.0707,  0.2930],
        [ 0.1231,  0.0313]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0559,  0.2691],
        [ 0.1317,  0.2173],
        [ 0.0042,  0.2846],
        [ 0.0156,  0.1883],
        [-0.0606,  0.1961],
        [-0.0138,  0.1782],
        [ 0.1340,  0.0767],
        [ 0.1930,  0.0874],
        [-0.0402,  0.1478],
        [ 0.0089,  0.1189],
        [ 0.1685,  0.1585],
        [ 0.0834,  0.2029]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0939,  0.0094],
        [-0.0338,  0.0863],
        [ 0.2420,  0.1280],
        [ 0.0039,  0.2093],
        [-0.0134,  0.2370],
        [ 0.0848,  0.2489],
        [-0.1336,  0.2782],
        [ 0.0741,  0.2192],
        [ 0.1092,  0.2043],
        [ 0.0161,  0.2238],
        [ 0.1049,  0.1986],
        [ 0.0460,  0.1904]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0175,  0.2718],
        [ 0.0453,  0.0542],
        [-0.0022,  0.1250],
        [-0.0225,  0.2403],
        [ 0.1420,  0.1748],
        [ 0.1704,  0.1475],
        [ 0.0305,  0.2916],
        [-0.0102,  0.1566],
        [-0.0209,  0.1013],
        [-0.0158,  0.1755],
        [ 0.1577,  0.1038],
        [ 0.2966, -0.0532]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0661,  0.0753],
        [-0.0344,  0.2649],
        [ 0.0805,  0.1311],
        [-0.0175,  0.2290],
        [ 0.0231,  0.1524],
        [ 0.1320,  0.1476],
        [ 0.1055,  0.2438],
        [-0.0253,  0.1361],
        [ 0.0981,  0.1876],
        [ 0.1116,  0.1593],
        [ 0.0464,  0.2680],
        [-0.0213,  0.4855]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0208,  0.2197],
        [-0.0160, -0.0602],
        [ 0.1157,  0.0910],
        [ 0.0762,  0.0730],
        [ 0.1786,  0.1352],
        [ 0.1138,  0.1521],
        [-0.0274,  0.2540],
        [ 0.0517,  0.0678],
        [ 0.2302,  0.1081],
        [ 0.1329, -0.0025],
        [ 0.0393,  0.1297],
        [ 0.1464,  0.1332]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.0719,  0.1972],
        [ 0.0644, -0.1107],
        [-0.0249,  0.1220],
        [-0.1298,  0.3262],
        [ 0.1327,  0.2506],
        [ 0.2971,  0.1031],
        [-0.0049,  0.2468],
        [ 0.1104,  0.1349],
        [ 0.1721,  0.1984],
        [ 0.1197,  0.1211],
        [-0.2373,  0.2160],
        [ 0.2142,  0.1202]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0500,  0.2425],
        [ 0.0287,  0.1364],
        [-0.0542,  0.2013],
        [ 0.0520,  0.3638],
        [ 0.2209,  0.2366],
        [ 0.0009,  0.3050],
        [-0.1370,  0.2054],
        [ 0.0326, -0.0038],
        [-0.0244,  0.3190],
        [-0.0756,  0.1788],
        [ 0.1401,  0.0097],
        [ 0.1622,  0.0825]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0771,  0.2280],
        [ 0.1092,  0.1452],
        [ 0.1491,  0.2891],
        [ 0.0350,  0.1732],
        [ 0.0752,  0.2251],
        [-0.0345,  0.2616],
        [-0.1818,  0.1731],
        [-0.1055,  0.2478],
        [ 0.0955,  0.2235],
        [ 0.0757,  0.2320],
        [ 0.0288,  0.2235],
        [ 0.1184,  0.1651]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0492,  0.1842],
        [ 0.1167, -0.0291],
        [ 0.1255,  0.2591],
        [-0.0501,  0.2430],
        [ 0.1036,  0.2357],
        [ 0.2838,  0.0028],
        [-0.2270,  0.1531],
        [ 0.0154,  0.0942],
        [ 0.0374,  0.2219],
        [ 0.0799,  0.1788],
        [ 0.0472,  0.1058],
        [ 0.1835,  0.1962]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.1052,  0.0907],
        [ 0.0641,  0.1769],
        [ 0.1225,  0.2987],
        [ 0.1300,  0.1073],
        [ 0.1279,  0.0845],
        [ 0.1638,  0.0938],
        [-0.0246,  0.2819],
        [ 0.0284,  0.1137],
        [-0.0027,  0.1370],
        [-0.1420,  0.3344],
        [ 0.0112,  0.1430],
        [-0.0286,  0.2702]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0331,  0.3178],
        [-0.0029,  0.0757],
        [ 0.1562,  0.1713],
        [ 0.1381,  0.1041],
        [ 0.2241,  0.1610],
        [ 0.0103,  0.1759],
        [ 0.0009,  0.0977],
        [-0.0194,  0.3138],
        [-0.0131,  0.3374],
        [ 0.0552,  0.2885],
        [-0.0116,  0.1977],
        [ 0.0704,  0.1491]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0020,  0.2816],
        [-0.0535,  0.2490],
        [ 0.0544,  0.2660],
        [-0.0245,  0.2965],
        [ 0.0877,  0.1872],
        [ 0.0875,  0.1195],
        [ 0.1092,  0.0920],
        [ 0.1061,  0.1573],
        [ 0.0591,  0.0969],
        [-0.0202,  0.1348],
        [ 0.0153,  0.1630],
        [-0.0119,  0.1336]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.1087,  0.1602],
        [-0.0535,  0.1994],
        [ 0.2063,  0.0886],
        [ 0.0682,  0.0757],
        [-0.1291,  0.2111],
        [ 0.1696,  0.1142],
        [-0.1063,  0.1513],
        [ 0.1288,  0.1084],
        [ 0.0361,  0.2408],
        [ 0.1391,  0.0575],
        [-0.0440,  0.2706],
        [ 0.0847,  0.0900]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1109,  0.1714],
        [-0.0269,  0.1422],
        [ 0.2454,  0.0798],
        [-0.0733,  0.1308],
        [-0.0151,  0.0985],
        [ 0.0453,  0.1008],
        [ 0.0167,  0.3237],
        [-0.0272,  0.1153],
        [-0.0797,  0.0165],
        [ 0.1702,  0.1392],
        [ 0.0300,  0.1239],
        [ 0.2743,  0.0210]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.1037,  0.1476],
        [-0.0916,  0.3258],
        [-0.0663,  0.1869],
        [ 0.0640,  0.0678],
        [ 0.0143,  0.1941],
        [ 0.0035,  0.1918],
        [-0.0211,  0.2596],
        [ 0.0996,  0.1332],
        [ 0.0810,  0.0630],
        [ 0.0170,  0.1645],
        [-0.0966,  0.2847],
        [-0.1065,  0.3506]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.1087,  0.2167],
        [ 0.0405, -0.0179],
        [ 0.1495,  0.0586],
        [ 0.1636,  0.0660],
        [ 0.1176,  0.1102],
        [ 0.2141,  0.1321],
        [ 0.0147,  0.1398],
        [ 0.0567,  0.0150],
        [ 0.1703,  0.2360],
        [ 0.1357,  0.1647],
        [ 0.0146,  0.2033],
        [ 0.2551,  0.2318]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.0197,  0.1996],
        [-0.0703,  0.1045],
        [-0.0206,  0.0548],
        [-0.1560,  0.2278],
        [ 0.1337,  0.0137],
        [ 0.1193,  0.0676],
        [ 0.0885,  0.2234],
        [ 0.0157,  0.2191],
        [ 0.1377,  0.1519],
        [ 0.1857,  0.0289],
        [-0.0479,  0.2508],
        [ 0.1722,  0.0749]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.2619,  0.3257],
        [ 0.1480,  0.0422],
        [ 0.0857,  0.2406],
        [ 0.0701,  0.2713],
        [ 0.1513,  0.1704],
        [ 0.0324,  0.2677],
        [-0.0163,  0.2126],
        [ 0.2959,  0.0938],
        [ 0.0573,  0.2168],
        [-0.0507,  0.2730],
        [-0.0567,  0.2722],
        [ 0.0196,  0.1633]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0162,  0.2027],
        [ 0.0940,  0.0792],
        [ 0.0536,  0.1266],
        [-0.1298,  0.1994],
        [ 0.0576,  0.2155],
        [-0.0233,  0.3718],
        [-0.0431,  0.3019],
        [-0.0134,  0.2264],
        [ 0.0785,  0.3873],
        [ 0.1187,  0.0928],
        [-0.1219,  0.2618],
        [ 0.1119,  0.0990]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[ 0.0870,  0.1367],
        [-0.0930,  0.2743],
        [-0.1596,  0.1961],
        [-0.1116,  0.2108],
        [ 0.1092,  0.2289],
        [ 0.2098,  0.1490],
        [-0.2569,  0.2793],
        [-0.1381,  0.3777],
        [-0.0108,  0.2371],
        [ 0.0696,  0.2232],
        [-0.0428,  0.2545],
        [-0.0395,  0.2136]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0139,  0.1639],
        [-0.0444,  0.2431],
        [ 0.0776,  0.2005],
        [ 0.0181,  0.3021],
        [ 0.0766,  0.1959],
        [ 0.1924,  0.2703],
        [-0.0807,  0.3006],
        [ 0.0299,  0.0420],
        [ 0.0847,  0.2836],
        [ 0.0198,  0.3121],
        [-0.0818,  0.2267],
        [ 0.1366,  0.2730]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0042,  0.1912],
        [ 0.0089,  0.1724],
        [ 0.1383,  0.1978],
        [ 0.2142,  0.1544],
        [ 0.1302,  0.1492],
        [ 0.0526,  0.0474],
        [-0.0679,  0.1605],
        [-0.1681,  0.4032],
        [ 0.0303,  0.3721],
        [-0.0678,  0.2129],
        [ 0.1592,  0.1908],
        [ 0.0644,  0.1637]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0245,  0.0774],
        [-0.2152,  0.1031],
        [-0.1715,  0.2362],
        [-0.1668,  0.4346],
        [-0.0198,  0.0857],
        [-0.0965,  0.1479],
        [ 0.0492,  0.0954],
        [ 0.1192,  0.0871],
        [ 0.0804,  0.2146],
        [ 0.0720,  0.1067],
        [ 0.0660,  0.1403],
        [ 0.0724,  0.2676]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0802,  0.1567],
        [-0.1814,  0.2383],
        [ 0.0136,  0.0591],
        [ 0.0127,  0.2408],
        [-0.0283,  0.3742],
        [ 0.0071,  0.3356],
        [-0.0799,  0.1847],
        [ 0.1375,  0.1403],
        [ 0.0004,  0.1039],
        [ 0.0531,  0.3178],
        [-0.1220,  0.2797],
        [-0.0513,  0.1645]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0207,  0.1456],
        [ 0.1444,  0.1397],
        [ 0.1488,  0.2010],
        [-0.0846,  0.2679],
        [ 0.0428,  0.1903],
        [ 0.0803,  0.1775],
        [ 0.0015,  0.2330],
        [-0.0087,  0.0981],
        [-0.0453,  0.0796],
        [ 0.0541,  0.1983],
        [ 0.1515,  0.1165],
        [ 0.1229, -0.0637]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 2.2026e-02,  2.2364e-01],
        [-3.8576e-02,  4.9745e-01],
        [-3.8143e-02,  2.8329e-01],
        [-8.4464e-05,  9.1259e-02],
        [ 2.1668e-01,  3.7158e-02],
        [ 3.7129e-02,  9.9961e-02],
        [-8.7018e-03,  2.8622e-01],
        [ 2.6369e-02,  1.5912e-01],
        [ 1.1492e-01,  2.1861e-01],
        [ 1.0997e-01,  2.8190e-01],
        [ 3.2331e-02,  1.9641e-01],
        [ 1.8180e-02,  2.1227e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0918,  0.1862],
        [-0.0128,  0.1278],
        [ 0.0509,  0.1685],
        [ 0.0976,  0.1336],
        [ 0.0366,  0.1470],
        [ 0.0397,  0.1130],
        [-0.2486,  0.2378],
        [-0.0039,  0.0907],
        [ 0.1388,  0.2762],
        [ 0.2114,  0.1111],
        [ 0.0305,  0.2406],
        [ 0.2389,  0.1066]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.0365,  0.3240],
        [-0.1703, -0.0054],
        [ 0.0059,  0.2018],
        [-0.0873,  0.3290],
        [ 0.0595,  0.1828],
        [ 0.3401, -0.0350],
        [ 0.0259,  0.1835],
        [ 0.1560,  0.0645],
        [ 0.0754,  0.2309],
        [ 0.2985,  0.1535],
        [-0.2215,  0.3595],
        [-0.1160,  0.2378]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.0709,  0.2405],
        [ 0.0997,  0.0717],
        [ 0.0428,  0.1594],
        [ 0.1182,  0.1920],
        [ 0.1921,  0.0635],
        [ 0.0033,  0.2826],
        [ 0.0055,  0.2572],
        [ 0.1851, -0.0091],
        [ 0.0067,  0.2388],
        [ 0.1644,  0.1777],
        [ 0.0014,  0.2931],
        [ 0.1373,  0.0396]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0009,  0.1832],
        [ 0.1467,  0.1473],
        [ 0.0989,  0.1214],
        [-0.1064,  0.1889],
        [ 0.0466,  0.2736],
        [ 0.0401,  0.1930],
        [ 0.0595,  0.1543],
        [ 0.0228,  0.0854],
        [ 0.0169,  0.2438],
        [ 0.0665,  0.3045],
        [ 0.1449,  0.1845],
        [ 0.1640,  0.0286]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0191,  0.2233],
        [-0.0390,  0.2186],
        [-0.1510,  0.3625],
        [-0.0450,  0.2842],
        [ 0.2156,  0.2797],
        [ 0.1274,  0.1080],
        [-0.4223,  0.3750],
        [-0.0397,  0.1841],
        [ 0.0417,  0.1764],
        [ 0.0401,  0.3240],
        [-0.1105,  0.2714],
        [ 0.0844,  0.1387]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0774,  0.0746],
        [ 0.0531,  0.3422],
        [ 0.0294,  0.3875],
        [ 0.0633,  0.1872],
        [ 0.0680,  0.3567],
        [ 0.0868,  0.0579],
        [ 0.1045,  0.1827],
        [ 0.0979,  0.0932],
        [ 0.0406,  0.1353],
        [-0.1565,  0.3418],
        [-0.1540,  0.1802],
        [ 0.0842,  0.0480]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0077,  0.2037],
        [-0.0637,  0.2021],
        [ 0.0919,  0.2390],
        [ 0.1062,  0.1626],
        [ 0.1346,  0.1089],
        [ 0.1231,  0.0790],
        [-0.0158,  0.2560],
        [-0.0927,  0.3893],
        [ 0.0802,  0.2027],
        [-0.0410,  0.2737],
        [-0.0190,  0.1030],
        [ 0.1378,  0.1782]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0257,  0.2068],
        [ 0.0840,  0.1960],
        [ 0.1022,  0.0650],
        [-0.1650,  0.2838],
        [ 0.1462,  0.0211],
        [ 0.1591,  0.1070],
        [ 0.2102, -0.0399],
        [ 0.0666,  0.1742],
        [ 0.0890,  0.0770],
        [-0.1419,  0.2917],
        [ 0.1781,  0.1626],
        [ 0.0210,  0.2334]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0430,  0.0815],
        [ 0.0050,  0.2622],
        [ 0.2310,  0.0079],
        [-0.0075,  0.1223],
        [-0.0761,  0.3729],
        [ 0.1343,  0.1647],
        [-0.0877,  0.2196],
        [ 0.1249,  0.0787],
        [ 0.1350,  0.0742],
        [-0.0436,  0.1891],
        [-0.0186,  0.1066],
        [ 0.1338,  0.2243]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0684,  0.2127],
        [-0.0177,  0.1500],
        [ 0.2797,  0.1333],
        [ 0.0849,  0.1805],
        [-0.1716,  0.2012],
        [-0.0064,  0.1801],
        [-0.1534,  0.2648],
        [-0.0450,  0.2257],
        [ 0.0334,  0.0800],
        [ 0.1063,  0.1693],
        [ 0.0841,  0.1507],
        [ 0.2563, -0.0615]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0681,  0.1356],
        [ 0.0393,  0.2719],
        [-0.0468,  0.2187],
        [ 0.1125,  0.0395],
        [ 0.2124,  0.1110],
        [ 0.1649,  0.0530],
        [ 0.0528,  0.1653],
        [-0.0223,  0.2093],
        [ 0.0218,  0.3189],
        [ 0.0840,  0.2253],
        [ 0.0841,  0.1695],
        [ 0.0599,  0.2544]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0223,  0.1242],
        [-0.0329,  0.2333],
        [ 0.0811,  0.1994],
        [ 0.0790,  0.1890],
        [ 0.0482,  0.0683],
        [ 0.1876,  0.1644],
        [-0.0139,  0.3202],
        [ 0.1897, -0.0696],
        [ 0.0883,  0.1095],
        [ 0.2893,  0.1674],
        [ 0.0699,  0.1998],
        [ 0.0135,  0.3197]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.0071,  0.2397],
        [-0.1068,  0.1334],
        [-0.0375,  0.0051],
        [-0.0844,  0.3690],
        [-0.0681,  0.3616],
        [ 0.2794, -0.0603],
        [-0.0705,  0.4048],
        [ 0.0720,  0.1923],
        [ 0.1561,  0.2508],
        [ 0.0676,  0.3383],
        [-0.1925,  0.3575],
        [ 0.0854,  0.0830]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1374,  0.0773],
        [ 0.0697,  0.0866],
        [ 0.0199,  0.2989],
        [ 0.1026,  0.3170],
        [ 0.0326,  0.1440],
        [-0.0766,  0.3850],
        [-0.1104,  0.1857],
        [ 0.0807,  0.1593],
        [ 0.0640,  0.2506],
        [-0.0414,  0.0919],
        [ 0.0593,  0.2772],
        [ 0.0734,  0.1276]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0472,  0.3278],
        [ 0.0053,  0.1188],
        [ 0.0118,  0.2361],
        [ 0.0994,  0.2364],
        [ 0.0290,  0.2921],
        [-0.0118,  0.3400],
        [-0.0559,  0.1272],
        [-0.0285,  0.2517],
        [ 0.0062,  0.3027],
        [ 0.0184,  0.1535],
        [-0.2765,  0.2743],
        [ 0.1813,  0.0466]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1330,  0.2182],
        [-0.0684,  0.2911],
        [-0.1221,  0.3906],
        [-0.0452,  0.1667],
        [ 0.1437,  0.3015],
        [ 0.2401,  0.1355],
        [-0.1565,  0.2878],
        [-0.1081,  0.3064],
        [ 0.0390,  0.2175],
        [-0.0998,  0.3023],
        [-0.0494,  0.2352],
        [ 0.0381,  0.2094]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0903,  0.2719],
        [-0.0902,  0.2335],
        [-0.0129,  0.1631],
        [-0.0417,  0.3615],
        [-0.0045,  0.2057],
        [ 0.1375,  0.0230],
        [-0.0018,  0.2421],
        [ 0.0634,  0.0809],
        [-0.1727,  0.4102],
        [-0.1824,  0.2600],
        [ 0.0080,  0.2675],
        [-0.0842,  0.3741]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0195,  0.2162],
        [ 0.0690,  0.0164],
        [-0.0038,  0.1546],
        [ 0.1075,  0.1295],
        [-0.0192,  0.2555],
        [ 0.0667,  0.1198],
        [ 0.1174,  0.1717],
        [-0.1383,  0.2490],
        [ 0.0132,  0.2887],
        [ 0.0104,  0.2833],
        [ 0.0065,  0.1532],
        [ 0.0669,  0.2758]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.1678,  0.1752],
        [-0.0152,  0.1978],
        [ 0.1204,  0.0771],
        [-0.1540,  0.2621],
        [ 0.1182,  0.0422],
        [ 0.2330,  0.0823],
        [ 0.1010,  0.1211],
        [ 0.0779,  0.2182],
        [ 0.1489,  0.0997],
        [ 0.0679,  0.1579],
        [-0.0564,  0.3383],
        [-0.1226,  0.2818]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0064,  0.0999],
        [ 0.0034,  0.2526],
        [ 0.2099,  0.1869],
        [ 0.0091,  0.1698],
        [-0.1214,  0.2208],
        [ 0.0457,  0.2396],
        [-0.0662,  0.2941],
        [ 0.0924,  0.2078],
        [ 0.0744, -0.0157],
        [ 0.0010,  0.1948],
        [-0.0546,  0.2270],
        [-0.0711,  0.2297]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0432,  0.0581],
        [ 0.1018,  0.0624],
        [ 0.0946,  0.1573],
        [ 0.0809,  0.2264],
        [-0.1697,  0.3646],
        [ 0.0009,  0.2205],
        [-0.1052,  0.1875],
        [-0.1424,  0.2692],
        [-0.0169,  0.1707],
        [-0.0714,  0.1486],
        [-0.0531,  0.2366],
        [ 0.2068,  0.0812]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0217,  0.2757],
        [-0.0581,  0.3013],
        [-0.1584,  0.2386],
        [-0.0259,  0.2057],
        [ 0.0852,  0.0951],
        [ 0.0510,  0.2180],
        [ 0.0290,  0.2905],
        [ 0.0566,  0.1297],
        [ 0.1915,  0.1883],
        [ 0.0545,  0.2226],
        [-0.1592,  0.2013],
        [-0.0413,  0.2439]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0888,  0.1549],
        [-0.2414,  0.1055],
        [ 0.1565,  0.1336],
        [ 0.1152,  0.1822],
        [-0.0818,  0.1174],
        [-0.0220,  0.1866],
        [-0.3086,  0.3836],
        [-0.1323,  0.2366],
        [ 0.0513,  0.1333],
        [ 0.1412,  0.0337],
        [ 0.0480,  0.2455],
        [ 0.1021,  0.1205]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.0048,  0.2401],
        [-0.0935,  0.0838],
        [ 0.1002,  0.0598],
        [-0.3239,  0.5020],
        [ 0.0795,  0.2865],
        [ 0.0863,  0.1868],
        [ 0.0749,  0.3092],
        [ 0.0848,  0.0597],
        [ 0.0785,  0.2933],
        [ 0.2401,  0.1419],
        [-0.2732,  0.3240],
        [-0.0010,  0.1998]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 1.1232e-01,  2.1577e-01],
        [-7.4040e-02,  1.5202e-01],
        [-7.8155e-02,  3.6382e-01],
        [ 1.7361e-01,  1.1840e-01],
        [ 6.9127e-02,  1.9000e-01],
        [ 2.5831e-04,  2.7282e-01],
        [ 1.1194e-01,  1.7920e-01],
        [ 3.4246e-02,  1.3284e-01],
        [-4.7283e-02,  2.3496e-01],
        [ 6.2706e-02,  1.4310e-01],
        [ 2.5976e-02,  2.1277e-01],
        [ 1.2303e-01,  1.3638e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0027,  0.2025],
        [ 0.1236,  0.1372],
        [ 0.0130,  0.2955],
        [-0.1182,  0.2350],
        [ 0.0593,  0.2854],
        [-0.0517,  0.1975],
        [-0.1777,  0.3318],
        [-0.1579,  0.2683],
        [ 0.0300,  0.2319],
        [ 0.0166,  0.1704],
        [-0.0526,  0.2593],
        [ 0.1002,  0.0685]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1438,  0.2064],
        [-0.0984,  0.3312],
        [-0.0570,  0.2388],
        [-0.0890,  0.2875],
        [ 0.1464,  0.1194],
        [ 0.1741,  0.1314],
        [-0.3570,  0.3286],
        [ 0.0220,  0.1907],
        [ 0.0724,  0.1600],
        [-0.0036,  0.3152],
        [-0.0316,  0.3017],
        [ 0.0981,  0.1059]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.1764,  0.0642],
        [-0.1151,  0.3052],
        [ 0.1646,  0.1792],
        [ 0.0917,  0.1120],
        [ 0.1451,  0.1402],
        [ 0.1334,  0.1296],
        [-0.1809,  0.3158],
        [ 0.1515,  0.1381],
        [-0.0367,  0.2822],
        [-0.1182,  0.2455],
        [-0.0097,  0.0972],
        [ 0.1461,  0.1642]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.2384,  0.2325],
        [ 0.1875,  0.1246],
        [ 0.1009, -0.0699],
        [ 0.1683,  0.1075],
        [ 0.1085,  0.0712],
        [ 0.2690, -0.0625],
        [-0.0313,  0.3102],
        [-0.0838,  0.2130],
        [ 0.1207,  0.2365],
        [-0.0208,  0.3068],
        [ 0.0506,  0.2326],
        [-0.0320,  0.1701]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.1750,  0.3265],
        [-0.0449,  0.1880],
        [ 0.1305,  0.0623],
        [-0.0835,  0.2191],
        [ 0.0930,  0.0788],
        [ 0.1659,  0.0720],
        [ 0.1353,  0.0666],
        [ 0.0472,  0.1375],
        [ 0.0786,  0.1853],
        [ 0.1803, -0.0576],
        [ 0.0465,  0.2638],
        [-0.1416,  0.2974]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0447,  0.2841],
        [-0.0531,  0.1362],
        [ 0.2039,  0.1009],
        [-0.0351,  0.3694],
        [ 0.0304,  0.2400],
        [-0.0339,  0.1687],
        [-0.0422,  0.1936],
        [-0.0129,  0.1291],
        [ 0.1477,  0.0146],
        [ 0.0140,  0.1505],
        [ 0.0315,  0.1804],
        [ 0.1982,  0.1168]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0766,  0.0329],
        [ 0.0756,  0.0380],
        [ 0.2037,  0.0512],
        [ 0.0893,  0.1083],
        [ 0.0071,  0.1055],
        [ 0.0225,  0.2155],
        [ 0.0693,  0.1516],
        [-0.0571,  0.1692],
        [ 0.0835,  0.2754],
        [ 0.1236, -0.0635],
        [ 0.1777,  0.1268],
        [ 0.4013, -0.1011]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0777,  0.0184],
        [ 0.0140,  0.0619],
        [-0.0187,  0.1287],
        [-0.0029,  0.2617],
        [ 0.1085,  0.2165],
        [-0.0934,  0.1468],
        [-0.0374,  0.1944],
        [ 0.0208,  0.2242],
        [ 0.2720, -0.0167],
        [-0.0078,  0.2071],
        [ 0.0232,  0.3109],
        [ 0.1656,  0.2613]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.1174,  0.1871],
        [-0.0219,  0.1567],
        [ 0.0650,  0.1867],
        [ 0.1385,  0.2399],
        [-0.1450,  0.2677],
        [ 0.1171,  0.1024],
        [-0.0584,  0.3661],
        [-0.0667,  0.1096],
        [ 0.1268,  0.0839],
        [ 0.1989, -0.1242],
        [ 0.0899,  0.1377],
        [ 0.0539,  0.1239]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.1041,  0.2364],
        [ 0.1192,  0.0273],
        [ 0.1575,  0.1204],
        [-0.0658,  0.2172],
        [ 0.0570,  0.1745],
        [ 0.2479, -0.0226],
        [ 0.0059,  0.2224],
        [ 0.2620,  0.0096],
        [ 0.2553,  0.1113],
        [ 0.1809,  0.0729],
        [-0.1252,  0.2004],
        [ 0.2639,  0.2060]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1267,  0.2265],
        [-0.0476,  0.0208],
        [ 0.0511,  0.1599],
        [ 0.1445,  0.0377],
        [ 0.1947,  0.1181],
        [ 0.0069,  0.2733],
        [-0.0894,  0.3441],
        [ 0.0778,  0.0488],
        [-0.0250,  0.2135],
        [ 0.0539,  0.1329],
        [-0.0652,  0.1105],
        [-0.0091,  0.1858]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.1298,  0.0288],
        [ 0.2086,  0.0621],
        [ 0.0554,  0.1293],
        [ 0.1103, -0.1010],
        [ 0.0644,  0.1457],
        [-0.0272,  0.2635],
        [-0.0585,  0.0871],
        [ 0.0016,  0.2198],
        [ 0.1530,  0.1720],
        [ 0.0536,  0.1554],
        [ 0.1179,  0.1166],
        [ 0.3280,  0.0346]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0617,  0.1037],
        [ 0.0964,  0.0796],
        [-0.1301,  0.2524],
        [ 0.0429,  0.1927],
        [ 0.1671,  0.2125],
        [ 0.1334, -0.0162],
        [-0.1902,  0.1808],
        [-0.0014,  0.1263],
        [ 0.1341,  0.0981],
        [ 0.1207,  0.2447],
        [ 0.0301,  0.1621],
        [ 0.0285,  0.2114]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.1523,  0.1571],
        [ 0.0165,  0.1916],
        [ 0.0632,  0.0860],
        [ 0.1449,  0.2407],
        [ 0.0469,  0.1102],
        [ 0.1142,  0.0313],
        [ 0.0071,  0.2263],
        [ 0.0376,  0.1434],
        [ 0.1656,  0.2218],
        [ 0.0711,  0.2557],
        [-0.0088,  0.0298],
        [ 0.0524,  0.1995]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0945,  0.2081],
        [-0.0788,  0.1081],
        [ 0.0609,  0.1088],
        [-0.0382,  0.1051],
        [ 0.2150,  0.0981],
        [ 0.2031,  0.0757],
        [ 0.0270,  0.0565],
        [ 0.0886,  0.1119],
        [-0.0272,  0.3877],
        [ 0.2023,  0.1949],
        [ 0.1129,  0.0736],
        [-0.1316,  0.3206]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0329,  0.2842],
        [ 0.0356,  0.2423],
        [ 0.1252,  0.1810],
        [-0.0926,  0.3862],
        [ 0.1004,  0.0628],
        [ 0.0620,  0.0819],
        [ 0.0668,  0.0395],
        [-0.0546,  0.1977],
        [-0.0580,  0.2505],
        [ 0.0197,  0.1648],
        [-0.0009,  0.2556],
        [-0.0941,  0.3573]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0934,  0.1170],
        [-0.0509,  0.1640],
        [ 0.0764,  0.0446],
        [ 0.0715,  0.3261],
        [-0.1153,  0.1589],
        [ 0.1525,  0.0601],
        [-0.0080,  0.0424],
        [ 0.1180,  0.2003],
        [ 0.1257,  0.1139],
        [-0.0179,  0.2090],
        [-0.0406,  0.2854],
        [ 0.1669,  0.1613]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0042,  0.1671],
        [ 0.1288,  0.2757],
        [ 0.0614,  0.1794],
        [ 0.1125,  0.0660],
        [-0.0495,  0.2307],
        [ 0.0509,  0.1323],
        [ 0.0082,  0.1666],
        [-0.0749,  0.2057],
        [-0.0130,  0.2517],
        [ 0.0574,  0.0994],
        [ 0.2419,  0.0191],
        [ 0.2431, -0.0050]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.1323,  0.0485],
        [-0.0751,  0.3498],
        [ 0.0211,  0.0532],
        [ 0.0055,  0.0956],
        [ 0.2058,  0.0091],
        [ 0.1482,  0.0142],
        [-0.0908,  0.1842],
        [-0.0332,  0.1211],
        [ 0.1683, -0.0229],
        [ 0.0568,  0.0899],
        [ 0.1080,  0.2093],
        [ 0.0715,  0.2326]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.1575,  0.2470],
        [-0.1654,  0.1869],
        [ 0.0737,  0.0893],
        [ 0.2010, -0.0130],
        [-0.1485,  0.1924],
        [ 0.0571,  0.3088],
        [-0.0827,  0.1167],
        [ 0.1272,  0.0528],
        [ 0.2379,  0.0116],
        [ 0.2102,  0.0407],
        [ 0.0558,  0.0938],
        [ 0.0449,  0.1941]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.0069,  0.1974],
        [-0.2490,  0.0405],
        [ 0.2018,  0.1518],
        [-0.1459,  0.3167],
        [-0.0546,  0.2015],
        [ 0.1875, -0.0748],
        [-0.1297,  0.1921],
        [-0.0901,  0.2530],
        [ 0.0600,  0.2108],
        [-0.0621,  0.1503],
        [-0.2018,  0.3114],
        [-0.0203,  0.2100]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1962,  0.1586],
        [-0.0557,  0.0991],
        [-0.0231,  0.2544],
        [-0.0597,  0.2455],
        [ 0.0288,  0.2123],
        [-0.0639,  0.2289],
        [-0.3192,  0.3878],
        [ 0.2698, -0.0196],
        [ 0.0048,  0.2502],
        [ 0.0049,  0.1872],
        [-0.0881,  0.2063],
        [ 0.0855,  0.2002]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0537,  0.1586],
        [ 0.1734,  0.0673],
        [ 0.1697,  0.0919],
        [ 0.0034,  0.2120],
        [ 0.1260,  0.1264],
        [-0.0720,  0.3026],
        [ 0.1081,  0.1614],
        [-0.2015,  0.2647],
        [ 0.1064,  0.1370],
        [ 0.0570,  0.0975],
        [ 0.1411, -0.0534],
        [ 0.1661,  0.1052]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1438,  0.1512],
        [-0.0464,  0.2222],
        [ 0.0034,  0.3489],
        [ 0.0937,  0.1668],
        [ 0.1793,  0.1639],
        [ 0.0292,  0.2379],
        [-0.1864,  0.2359],
        [ 0.0447,  0.2242],
        [ 0.1047,  0.2127],
        [ 0.0766,  0.0010],
        [-0.0893,  0.1223],
        [ 0.0531,  0.1863]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0632,  0.1806],
        [-0.2560,  0.2544],
        [ 0.0694,  0.2248],
        [ 0.1660,  0.1907],
        [-0.0766,  0.4497],
        [ 0.2023,  0.1013],
        [-0.0878,  0.3279],
        [ 0.0270,  0.2534],
        [ 0.0329,  0.2127],
        [-0.1112,  0.2613],
        [ 0.1212,  0.0862],
        [ 0.1181,  0.2875]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0371,  0.2460],
        [ 0.1596,  0.0969],
        [ 0.1988,  0.1473],
        [ 0.1092,  0.0362],
        [ 0.0326,  0.1774],
        [ 0.1048,  0.0653],
        [ 0.0659,  0.2712],
        [-0.1303,  0.2985],
        [-0.0528,  0.2121],
        [ 0.0032,  0.1439],
        [ 0.0740,  0.0862],
        [-0.0876,  0.1768]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.1019, -0.0112],
        [-0.0087,  0.2450],
        [ 0.1475,  0.1409],
        [-0.1995,  0.4616],
        [ 0.0553,  0.2815],
        [ 0.0759,  0.0022],
        [ 0.2232,  0.0523],
        [ 0.1109,  0.1473],
        [-0.0261,  0.0578],
        [ 0.1646,  0.0699],
        [-0.0276,  0.1977],
        [-0.1571,  0.3693]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0286,  0.2165],
        [-0.0185,  0.2126],
        [ 0.1125, -0.0389],
        [-0.0600,  0.2464],
        [-0.1011,  0.2224],
        [ 0.0480,  0.1772],
        [-0.1632,  0.2544],
        [ 0.1584,  0.0288],
        [ 0.0819,  0.1291],
        [-0.0552,  0.1937],
        [-0.1292,  0.2897],
        [-0.0329,  0.0109]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0233,  0.0796],
        [-0.0039,  0.0698],
        [ 0.0572,  0.0239],
        [-0.1023,  0.1950],
        [-0.1216,  0.2570],
        [ 0.0759,  0.0975],
        [-0.1061,  0.2614],
        [-0.1050,  0.3722],
        [-0.0898,  0.2097],
        [ 0.0947,  0.1011],
        [ 0.1999,  0.1245],
        [ 0.2535,  0.0251]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.0268,  0.0917],
        [-0.0471,  0.3059],
        [-0.1829,  0.3453],
        [ 0.0041,  0.2680],
        [ 0.2428,  0.1260],
        [ 0.0588,  0.1042],
        [-0.0222,  0.2242],
        [-0.0113,  0.0480],
        [ 0.1599,  0.0481],
        [-0.0441,  0.2210],
        [-0.0202,  0.2768],
        [-0.1200,  0.2314]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0218,  0.2350],
        [-0.0640,  0.2219],
        [ 0.0815,  0.2569],
        [ 0.1071,  0.1034],
        [-0.0643,  0.1180],
        [ 0.0205,  0.1358],
        [-0.2753,  0.3569],
        [-0.0607,  0.0435],
        [ 0.1224,  0.2841],
        [ 0.1458,  0.1260],
        [ 0.0626,  0.0840],
        [ 0.0132,  0.0090]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.0325,  0.3309],
        [-0.0858,  0.1433],
        [ 0.0950,  0.0304],
        [-0.0705,  0.3781],
        [ 0.0882,  0.3069],
        [ 0.3988, -0.0756],
        [-0.0086,  0.1774],
        [ 0.0965,  0.0919],
        [ 0.1805, -0.0060],
        [ 0.1553,  0.0552],
        [-0.0037,  0.4279],
        [ 0.0651,  0.1927]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.2362,  0.1274],
        [ 0.1689,  0.1101],
        [ 0.0048,  0.2110],
        [ 0.0483,  0.0707],
        [ 0.1996,  0.1660],
        [-0.1838,  0.4206],
        [-0.0283,  0.1875],
        [ 0.1248,  0.0508],
        [-0.0592,  0.2277],
        [ 0.1097,  0.1648],
        [-0.2136,  0.2864],
        [ 0.0670,  0.1547]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0622,  0.0677],
        [ 0.0975,  0.0214],
        [ 0.1912,  0.1426],
        [ 0.0583,  0.0702],
        [ 0.1291,  0.2084],
        [-0.0405,  0.2367],
        [-0.2077,  0.2329],
        [ 0.0951,  0.2514],
        [ 0.0146,  0.2191],
        [ 0.0411,  0.0297],
        [ 0.1437,  0.1239],
        [ 0.2339,  0.0893]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[ 0.0920,  0.0446],
        [-0.1283,  0.2021],
        [-0.1754,  0.2337],
        [-0.0812,  0.2173],
        [ 0.0659,  0.3128],
        [ 0.1969,  0.0765],
        [-0.0645,  0.2748],
        [ 0.0703,  0.2500],
        [ 0.0087,  0.1560],
        [ 0.1258,  0.0835],
        [-0.1118,  0.2869],
        [ 0.1417,  0.0673]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0217,  0.1841],
        [-0.1060,  0.2110],
        [-0.0505,  0.1936],
        [-0.0816,  0.3030],
        [ 0.1423,  0.1286],
        [ 0.2403,  0.0460],
        [-0.1660,  0.2250],
        [ 0.0333,  0.1663],
        [ 0.0850,  0.1692],
        [ 0.0478,  0.2511],
        [ 0.2046,  0.2193],
        [-0.0215,  0.2997]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0190,  0.3109],
        [-0.0449,  0.0830],
        [-0.0520,  0.1655],
        [-0.0445,  0.2629],
        [-0.0744,  0.1545],
        [ 0.0032,  0.0671],
        [-0.1619,  0.2690],
        [-0.1974,  0.2202],
        [-0.0272,  0.3383],
        [-0.1869,  0.2467],
        [-0.0493,  0.2117],
        [ 0.0081,  0.1598]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0986,  0.0937],
        [-0.2093,  0.2474],
        [ 0.1350,  0.1217],
        [-0.1890,  0.2981],
        [ 0.1325,  0.0910],
        [ 0.1402,  0.0137],
        [ 0.0758,  0.0472],
        [-0.1299,  0.1976],
        [ 0.0587,  0.0600],
        [ 0.0069,  0.0846],
        [ 0.0101,  0.1617],
        [-0.1374,  0.1969]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0381,  0.1228],
        [ 0.0135,  0.1061],
        [-0.0288,  0.0822],
        [ 0.0293,  0.1326],
        [-0.1559,  0.1918],
        [-0.0532,  0.2897],
        [-0.0448,  0.1578],
        [ 0.0683,  0.0442],
        [ 0.0488,  0.1138],
        [-0.0502,  0.1512],
        [-0.0856,  0.2941],
        [ 0.0637,  0.1615]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0408,  0.1656],
        [ 0.1138,  0.1446],
        [ 0.0903,  0.0553],
        [ 0.1084,  0.1424],
        [-0.1171,  0.3410],
        [-0.0291,  0.3183],
        [-0.0196,  0.2526],
        [-0.2712,  0.2867],
        [-0.0089,  0.2017],
        [ 0.0674,  0.2096],
        [ 0.0580,  0.1667],
        [ 0.2891,  0.0519]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0617,  0.0208],
        [ 0.0075,  0.1585],
        [-0.1027,  0.2745],
        [-0.1017,  0.1049],
        [ 0.2260,  0.0335],
        [ 0.0689,  0.1894],
        [-0.1604,  0.2370],
        [ 0.0506,  0.2477],
        [ 0.0879,  0.1598],
        [ 0.0477,  0.1870],
        [ 0.0678,  0.1047],
        [ 0.0947,  0.1694]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0550,  0.2261],
        [-0.0270,  0.1906],
        [ 0.1635,  0.0303],
        [-0.0094,  0.2449],
        [ 0.0901,  0.1250],
        [ 0.0393,  0.2568],
        [-0.0140,  0.2781],
        [-0.0686,  0.2365],
        [ 0.0293,  0.2799],
        [ 0.2935,  0.0310],
        [-0.1371,  0.2365],
        [ 0.2547,  0.0850]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.0343,  0.2679],
        [ 0.2359, -0.0021],
        [ 0.2415,  0.1084],
        [-0.0165,  0.1084],
        [ 0.1054,  0.1320],
        [ 0.1692, -0.1206],
        [ 0.2665,  0.0812],
        [-0.0300,  0.0976],
        [ 0.2376,  0.1182],
        [ 0.0310,  0.0696],
        [-0.1128,  0.2887],
        [ 0.0886,  0.1210]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1020,  0.2974],
        [ 0.0681,  0.1623],
        [ 0.0237,  0.1503],
        [-0.0227,  0.1078],
        [ 0.2888,  0.1580],
        [-0.0599,  0.1960],
        [-0.0275,  0.2360],
        [ 0.2746,  0.0551],
        [-0.0811,  0.2015],
        [-0.0625,  0.1267],
        [ 0.0274,  0.1927],
        [ 0.0168,  0.2640]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0066,  0.2582],
        [ 0.1846,  0.0723],
        [ 0.2014,  0.1192],
        [ 0.1032,  0.1995],
        [ 0.0284,  0.1688],
        [ 0.0107,  0.2822],
        [ 0.0162,  0.3136],
        [-0.0795,  0.2645],
        [ 0.1231,  0.0914],
        [ 0.1399,  0.0814],
        [ 0.1895,  0.2064],
        [ 0.2277,  0.1250]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1189,  0.1352],
        [ 0.0746,  0.2053],
        [-0.0983,  0.3344],
        [-0.0459,  0.1424],
        [ 0.2312,  0.1916],
        [ 0.1304,  0.2123],
        [-0.1255,  0.3090],
        [-0.0075,  0.1297],
        [-0.0288,  0.1367],
        [-0.0406,  0.1931],
        [ 0.0538,  0.1946],
        [ 0.1163,  0.1252]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.1204,  0.0937],
        [-0.0650,  0.2820],
        [ 0.1170,  0.1313],
        [ 0.0774,  0.0917],
        [ 0.2027,  0.1480],
        [ 0.2431,  0.0026],
        [-0.0368,  0.2681],
        [ 0.2786, -0.0823],
        [ 0.1979,  0.1044],
        [-0.0697,  0.2578],
        [ 0.1189,  0.0434],
        [ 0.0781,  0.1696]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0961,  0.1346],
        [ 0.0386, -0.0034],
        [ 0.1024,  0.0949],
        [-0.0657,  0.2507],
        [-0.0101,  0.3780],
        [ 0.1422,  0.1158],
        [ 0.0438,  0.1966],
        [-0.1277,  0.3294],
        [-0.0066,  0.3725],
        [ 0.1246,  0.2155],
        [-0.0776,  0.1888],
        [-0.0493,  0.2591]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0037,  0.2872],
        [-0.0904,  0.2801],
        [ 0.0038,  0.2408],
        [-0.1189,  0.4821],
        [ 0.0943,  0.1734],
        [ 0.1800,  0.1387],
        [ 0.0087,  0.2520],
        [ 0.1785,  0.1252],
        [-0.0037,  0.3606],
        [ 0.0992,  0.1006],
        [-0.1445,  0.2890],
        [-0.2191,  0.4493]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0164,  0.2658],
        [-0.1772,  0.2220],
        [ 0.1523,  0.1905],
        [ 0.0312,  0.1546],
        [ 0.0284,  0.2293],
        [ 0.1355,  0.0888],
        [-0.0982,  0.3608],
        [ 0.1042,  0.1236],
        [ 0.1294,  0.2073],
        [-0.0976,  0.2814],
        [-0.1161,  0.3490],
        [ 0.0813,  0.2247]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0691,  0.2290],
        [ 0.0531,  0.0537],
        [ 0.2931,  0.0031],
        [ 0.0226,  0.0470],
        [-0.1455,  0.3209],
        [ 0.1218,  0.1830],
        [ 0.0238,  0.1886],
        [-0.0519,  0.3297],
        [ 0.1116,  0.2101],
        [ 0.1055,  0.0683],
        [ 0.1201,  0.1352],
        [ 0.2547, -0.0047]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.1243,  0.1241],
        [ 0.0146,  0.2931],
        [-0.1175,  0.3463],
        [ 0.0633,  0.1024],
        [ 0.2652,  0.0490],
        [ 0.0530,  0.1331],
        [-0.0661,  0.1827],
        [ 0.0684,  0.2201],
        [ 0.1372,  0.1206],
        [-0.0101,  0.1811],
        [-0.0425,  0.1852],
        [ 0.0956,  0.2541]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0516,  0.2064],
        [ 0.1135,  0.1377],
        [-0.0591,  0.1578],
        [ 0.1741,  0.1535],
        [-0.0016,  0.2877],
        [ 0.0873,  0.2775],
        [ 0.0486,  0.2976],
        [ 0.0418,  0.0996],
        [-0.0427,  0.2652],
        [ 0.3137, -0.0417],
        [-0.1050,  0.0864],
        [ 0.2974,  0.0696]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1559,  0.2453],
        [ 0.0793,  0.1287],
        [ 0.2112,  0.0695],
        [-0.0906,  0.3295],
        [ 0.0965,  0.2279],
        [ 0.3338, -0.0621],
        [ 0.0541,  0.2189],
        [ 0.0073,  0.1926],
        [ 0.0125,  0.1036],
        [ 0.0429,  0.0843],
        [-0.2062,  0.2603],
        [ 0.1153,  0.1746]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1584,  0.2684],
        [ 0.0820,  0.1479],
        [-0.0587,  0.2762],
        [ 0.1884,  0.0802],
        [ 0.1581,  0.1542],
        [-0.1047,  0.3594],
        [-0.1726,  0.3268],
        [ 0.0869,  0.2068],
        [-0.0135,  0.2662],
        [-0.2285,  0.1957],
        [-0.1414,  0.3244],
        [ 0.0284,  0.2180]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0516,  0.1636],
        [ 0.0342,  0.2018],
        [ 0.2209,  0.2387],
        [-0.0298,  0.2919],
        [ 0.0484,  0.3023],
        [-0.0652,  0.1829],
        [-0.2251,  0.2944],
        [-0.0892,  0.3607],
        [-0.0799,  0.2608],
        [ 0.0998,  0.0317],
        [ 0.0935,  0.2418],
        [-0.0109,  0.2552]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[ 0.0467,  0.1925],
        [ 0.0027,  0.2366],
        [-0.0846,  0.3479],
        [ 0.0198,  0.1739],
        [ 0.1556,  0.2316],
        [ 0.1670,  0.2162],
        [-0.2636,  0.2717],
        [ 0.0585,  0.2224],
        [-0.0212,  0.2693],
        [-0.0276,  0.3415],
        [ 0.0167,  0.2587],
        [ 0.0253,  0.0758]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0667,  0.2164],
        [-0.0331,  0.1912],
        [-0.0816,  0.3168],
        [ 0.0791,  0.1018],
        [ 0.1175,  0.0946],
        [ 0.0740,  0.0306],
        [ 0.0166,  0.1477],
        [ 0.1324,  0.1028],
        [ 0.0833,  0.0870],
        [ 0.0134,  0.2187],
        [ 0.1894,  0.1127],
        [-0.0063,  0.1656]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.1943,  0.1762],
        [ 0.0898,  0.0206],
        [ 0.0846,  0.1273],
        [ 0.1039, -0.0438],
        [ 0.0417,  0.1646],
        [ 0.2262, -0.1083],
        [-0.0100,  0.1406],
        [-0.0030,  0.3255],
        [ 0.0845,  0.2927],
        [ 0.1553,  0.1054],
        [ 0.1267,  0.0667],
        [ 0.1219,  0.2394]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0636,  0.1612],
        [-0.1202,  0.1991],
        [-0.1467,  0.1614],
        [-0.0731,  0.3877],
        [ 0.2542,  0.0677],
        [ 0.0230,  0.2050],
        [ 0.2196,  0.1117],
        [ 0.0273,  0.1226],
        [-0.0053,  0.3536],
        [ 0.0358,  0.2701],
        [ 0.0569,  0.0725],
        [-0.0224,  0.4124]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0462,  0.2260],
        [-0.0444,  0.3327],
        [ 0.1364,  0.1004],
        [ 0.0856,  0.2046],
        [-0.1234,  0.3074],
        [-0.0042,  0.2508],
        [-0.1198,  0.2643],
        [ 0.0272,  0.2148],
        [ 0.0322,  0.2177],
        [-0.1336,  0.3248],
        [-0.0314,  0.3327],
        [ 0.1423,  0.2288]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0309,  0.2667],
        [-0.0497,  0.1381],
        [ 0.0674,  0.1192],
        [ 0.1127,  0.1606],
        [-0.1218,  0.2288],
        [ 0.1025,  0.1801],
        [-0.0766,  0.3495],
        [-0.0814,  0.3511],
        [ 0.0802,  0.1813],
        [-0.0035,  0.2011],
        [ 0.0790,  0.1146],
        [ 0.2409,  0.0518]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0160,  0.3035],
        [ 0.0969,  0.1928],
        [-0.0984,  0.2923],
        [ 0.0890,  0.2183],
        [ 0.2859,  0.0562],
        [ 0.0111,  0.1297],
        [-0.0251,  0.2713],
        [ 0.1332,  0.1704],
        [ 0.0614,  0.2107],
        [-0.0217,  0.2212],
        [ 0.0130,  0.3659],
        [-0.0389,  0.2730]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0794,  0.2253],
        [-0.1033,  0.2525],
        [-0.0326,  0.1939],
        [-0.0280,  0.3845],
        [-0.1148,  0.2036],
        [-0.0103,  0.1542],
        [-0.0763,  0.2459],
        [-0.0148,  0.1444],
        [ 0.1239,  0.1802],
        [ 0.2681,  0.0307],
        [-0.0193,  0.2407],
        [ 0.0905,  0.2111]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1050,  0.3024],
        [-0.0944,  0.1806],
        [ 0.1579,  0.0747],
        [-0.0850,  0.3179],
        [ 0.0753,  0.1613],
        [ 0.3869, -0.0602],
        [ 0.0264,  0.3042],
        [-0.0031,  0.1368],
        [ 0.1492,  0.2615],
        [ 0.1167,  0.0125],
        [-0.1237,  0.3994],
        [ 0.1429,  0.0832]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1325,  0.2371],
        [ 0.0649,  0.1607],
        [-0.0572,  0.3064],
        [ 0.0250,  0.2226],
        [ 0.0870,  0.2150],
        [-0.0296,  0.3772],
        [-0.2578,  0.3445],
        [ 0.0399,  0.0636],
        [-0.1731,  0.1971],
        [ 0.0474,  0.0476],
        [-0.1394,  0.3491],
        [-0.1504,  0.3108]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.1090,  0.2512],
        [ 0.0901,  0.1438],
        [ 0.0129,  0.2167],
        [ 0.0752,  0.2445],
        [-0.0068,  0.2992],
        [-0.0232,  0.3642],
        [-0.1083,  0.3676],
        [ 0.2348,  0.1983],
        [ 0.0401,  0.1654],
        [ 0.0425,  0.3359],
        [-0.1173,  0.0684],
        [ 0.1805,  0.0617]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0350,  0.2365],
        [ 0.0356,  0.2398],
        [-0.1413,  0.3285],
        [ 0.1180,  0.1469],
        [ 0.0054,  0.2234],
        [ 0.0708,  0.1370],
        [-0.1691,  0.2510],
        [ 0.1427,  0.1351],
        [ 0.0140,  0.0669],
        [ 0.0851,  0.1949],
        [-0.0983,  0.2745],
        [-0.0503,  0.1737]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.2068,  0.1558],
        [ 0.0118,  0.2186],
        [-0.0005,  0.2116],
        [-0.0922,  0.2629],
        [ 0.1441,  0.1701],
        [ 0.1974,  0.1608],
        [-0.2336,  0.3813],
        [ 0.3696, -0.0449],
        [ 0.0217,  0.1582],
        [ 0.0669,  0.0521],
        [ 0.0387,  0.2908],
        [ 0.0419,  0.1500]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.1368,  0.2109],
        [ 0.1402,  0.0643],
        [ 0.1070,  0.0555],
        [-0.0048,  0.1517],
        [ 0.0709,  0.1789],
        [ 0.2358,  0.0858],
        [ 0.0198,  0.1222],
        [-0.1770,  0.3488],
        [ 0.0592,  0.3446],
        [ 0.1811,  0.1104],
        [-0.0280,  0.2731],
        [-0.0422,  0.1755]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0187,  0.1099],
        [-0.0693,  0.2532],
        [ 0.0988,  0.1822],
        [-0.2178,  0.4320],
        [ 0.1599,  0.1025],
        [ 0.2226,  0.1363],
        [ 0.0233,  0.1659],
        [ 0.0705,  0.0998],
        [ 0.0397,  0.1820],
        [ 0.0579,  0.1302],
        [ 0.0494,  0.0430],
        [ 0.0356,  0.3206]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0533,  0.1058],
        [ 0.0491,  0.0937],
        [ 0.2162,  0.0522],
        [ 0.0307,  0.1103],
        [-0.0924,  0.2335],
        [ 0.1320,  0.1028],
        [ 0.0387,  0.0926],
        [ 0.1293, -0.0040],
        [ 0.1927,  0.1449],
        [-0.1093,  0.2738],
        [ 0.0540,  0.1401],
        [ 0.0157,  0.0965]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0044,  0.2298],
        [ 0.2302,  0.0971],
        [-0.0691,  0.1739],
        [ 0.1225, -0.0183],
        [-0.0336,  0.2543],
        [-0.0752,  0.1830],
        [-0.0918,  0.2816],
        [-0.0807,  0.3391],
        [ 0.1839,  0.0916],
        [-0.0084,  0.1798],
        [ 0.0641,  0.2131],
        [ 0.1789,  0.0026]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.1716,  0.1274],
        [-0.0234,  0.2223],
        [-0.0707,  0.1621],
        [ 0.0589,  0.1244],
        [ 0.2500, -0.0083],
        [ 0.0352,  0.2284],
        [-0.0949,  0.3200],
        [ 0.0870,  0.0858],
        [ 0.0501,  0.0433],
        [ 0.0790,  0.1833],
        [ 0.0923,  0.1811],
        [ 0.0719,  0.1887]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0815,  0.0984],
        [-0.0496,  0.1393],
        [ 0.0344,  0.0902],
        [ 0.0738,  0.1334],
        [-0.0021,  0.1770],
        [ 0.0219,  0.1683],
        [-0.0633,  0.2120],
        [-0.0605,  0.1691],
        [ 0.0171,  0.0902],
        [ 0.1464,  0.1122],
        [ 0.0477,  0.2213],
        [ 0.2684,  0.0509]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.0252,  0.2741],
        [-0.0562,  0.0902],
        [ 0.2643, -0.0563],
        [-0.0589,  0.1546],
        [ 0.2923, -0.0533],
        [ 0.3737, -0.1739],
        [-0.0345,  0.2242],
        [ 0.1460,  0.2039],
        [ 0.1318,  0.0181],
        [ 0.2578,  0.0677],
        [-0.1207,  0.2453],
        [ 0.0502,  0.0302]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1224,  0.1254],
        [-0.0181,  0.0974],
        [ 0.0211,  0.1764],
        [ 0.1602,  0.1198],
        [ 0.1416,  0.0821],
        [-0.0697,  0.3278],
        [-0.1178,  0.3276],
        [ 0.1606,  0.0565],
        [-0.0962,  0.2610],
        [ 0.1168,  0.0828],
        [-0.0259,  0.2333],
        [-0.0073,  0.2005]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0492,  0.1685],
        [ 0.1654,  0.2043],
        [ 0.1336,  0.2200],
        [-0.0859,  0.2545],
        [ 0.0874,  0.2083],
        [-0.1025,  0.2840],
        [-0.1359,  0.2228],
        [ 0.0231,  0.1329],
        [-0.0102,  0.2100],
        [-0.0217,  0.1738],
        [-0.0423,  0.1629],
        [ 0.1225,  0.0682]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1207,  0.2181],
        [ 0.0126,  0.1761],
        [-0.0562,  0.1182],
        [-0.0763,  0.1459],
        [ 0.0982,  0.1307],
        [ 0.1190,  0.0007],
        [-0.1578,  0.2946],
        [ 0.0743,  0.0113],
        [ 0.1411,  0.1314],
        [ 0.0397,  0.1921],
        [-0.0617,  0.2035],
        [ 0.0146,  0.0613]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0478,  0.0996],
        [-0.1937,  0.3522],
        [ 0.0201,  0.2068],
        [ 0.0038,  0.2289],
        [-0.0507,  0.2828],
        [ 0.1397,  0.1696],
        [-0.1442,  0.2431],
        [ 0.1610,  0.0820],
        [ 0.0644,  0.1261],
        [-0.2055,  0.2939],
        [ 0.1576,  0.2878],
        [-0.0330,  0.2267]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0948,  0.2370],
        [ 0.0728,  0.0153],
        [ 0.1277,  0.1415],
        [ 0.0162,  0.1294],
        [ 0.0976,  0.1398],
        [ 0.1285, -0.0921],
        [ 0.0105,  0.1788],
        [-0.1677,  0.1958],
        [ 0.1175,  0.1369],
        [ 0.1101,  0.2021],
        [-0.0115,  0.1417],
        [ 0.0967,  0.1778]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0248,  0.1618],
        [-0.1098,  0.2949],
        [ 0.0580,  0.2349],
        [-0.1216,  0.3415],
        [-0.0071,  0.2479],
        [ 0.2565,  0.0587],
        [ 0.0249,  0.1198],
        [ 0.0465,  0.0448],
        [-0.0339,  0.2220],
        [ 0.0433,  0.1706],
        [ 0.1056,  0.1055],
        [-0.0521,  0.2703]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0117,  0.2538],
        [-0.1076,  0.1726],
        [ 0.0752,  0.1652],
        [-0.0253,  0.2726],
        [-0.1328,  0.2498],
        [-0.0136,  0.1935],
        [-0.0051,  0.2630],
        [-0.0656,  0.1155],
        [ 0.0111,  0.1848],
        [-0.1347,  0.3367],
        [-0.1077,  0.3800],
        [ 0.1418,  0.2177]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0543,  0.2616],
        [ 0.0940,  0.0469],
        [ 0.1685,  0.1699],
        [ 0.1030,  0.1823],
        [-0.1308,  0.3776],
        [ 0.1959,  0.1046],
        [ 0.0285,  0.2105],
        [-0.0544,  0.2726],
        [ 0.0523,  0.1334],
        [-0.1350,  0.2216],
        [ 0.0200,  0.1447],
        [ 0.2430,  0.0422]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.0204,  0.1621],
        [ 0.0259,  0.2136],
        [-0.0522,  0.1666],
        [-0.1299,  0.2779],
        [ 0.3159,  0.0193],
        [ 0.1425,  0.0350],
        [ 0.0909,  0.2233],
        [ 0.1091,  0.1760],
        [ 0.1830,  0.0908],
        [-0.1434,  0.1816],
        [-0.0734,  0.1337],
        [ 0.0737,  0.1693]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0657,  0.0654],
        [ 0.1498,  0.0787],
        [ 0.1179,  0.0783],
        [ 0.0887,  0.0276],
        [-0.0814,  0.1481],
        [ 0.0083,  0.0927],
        [ 0.0262,  0.0456],
        [ 0.0248,  0.1880],
        [-0.0578,  0.1508],
        [ 0.2381,  0.1693],
        [ 0.0532,  0.1651],
        [ 0.2256,  0.0306]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[ 0.0405,  0.1593],
        [ 0.0720,  0.2860],
        [ 0.0424,  0.0717],
        [-0.1601,  0.3290],
        [ 0.0250,  0.1255],
        [ 0.2136, -0.0728],
        [-0.1204,  0.2080],
        [ 0.1242, -0.0196],
        [ 0.2128, -0.0128],
        [ 0.0649,  0.0293],
        [-0.1363,  0.3586],
        [ 0.1032,  0.0945]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1353,  0.2464],
        [ 0.0147,  0.0833],
        [-0.0026,  0.2450],
        [-0.0848,  0.2046],
        [ 0.1688,  0.0861],
        [-0.2041,  0.4183],
        [-0.3153,  0.3115],
        [-0.0050,  0.1189],
        [-0.0489,  0.2688],
        [-0.0390,  0.0918],
        [-0.1611,  0.3478],
        [ 0.0450,  0.1584]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0390,  0.1901],
        [ 0.1532,  0.1861],
        [ 0.2058,  0.0798],
        [ 0.0613,  0.1125],
        [-0.0103,  0.2619],
        [-0.0558,  0.3610],
        [-0.1604,  0.2395],
        [ 0.1156,  0.2514],
        [-0.0065,  0.1970],
        [ 0.1505, -0.0229],
        [ 0.0214,  0.1964],
        [ 0.1124,  0.1122]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0376,  0.2977],
        [-0.1238,  0.1721],
        [-0.0493,  0.2740],
        [-0.0079,  0.1765],
        [ 0.0606,  0.2136],
        [ 0.0881,  0.2433],
        [-0.2450,  0.2546],
        [-0.2091,  0.2864],
        [-0.0533,  0.2469],
        [-0.0986,  0.2760],
        [-0.1284,  0.4562],
        [ 0.0460,  0.0902]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0440,  0.1607],
        [-0.1512,  0.3418],
        [ 0.0896,  0.3312],
        [-0.0175,  0.2233],
        [ 0.1347,  0.1914],
        [ 0.0963,  0.2248],
        [-0.0321,  0.1909],
        [ 0.2263, -0.0114],
        [ 0.0052,  0.0960],
        [-0.1660,  0.3381],
        [ 0.0575,  0.0768],
        [-0.0140,  0.2083]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0511,  0.0856],
        [ 0.0971,  0.1104],
        [ 0.1516,  0.0425],
        [-0.0601,  0.1967],
        [-0.1074,  0.2179],
        [ 0.0502,  0.1022],
        [-0.1071,  0.1708],
        [-0.1565,  0.2493],
        [ 0.1958,  0.2057],
        [ 0.0798,  0.2090],
        [ 0.0139,  0.1545],
        [-0.0322,  0.2135]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.1474,  0.1772],
        [-0.0504,  0.0916],
        [ 0.0735,  0.0963],
        [-0.0320,  0.2185],
        [ 0.1643,  0.1312],
        [ 0.0528, -0.0777],
        [ 0.0575,  0.1792],
        [-0.0481,  0.1173],
        [-0.1198,  0.1699],
        [ 0.0226,  0.0514],
        [-0.1017,  0.2164],
        [-0.0045,  0.2944]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0409,  0.2706],
        [-0.0577,  0.2736],
        [ 0.0444,  0.1909],
        [-0.0502,  0.1568],
        [-0.2230,  0.1114],
        [-0.0359,  0.2027],
        [-0.1666,  0.2416],
        [ 0.1909, -0.0527],
        [-0.0471,  0.3248],
        [-0.2362,  0.2999],
        [-0.0343,  0.1974],
        [ 0.0748,  0.2679]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-1.8348e-02,  6.6585e-02],
        [-5.8818e-02,  8.5385e-02],
        [-8.8536e-03,  7.9276e-02],
        [ 1.3076e-01,  4.6625e-02],
        [-1.5378e-01,  3.4871e-01],
        [ 7.5929e-02,  9.2387e-02],
        [-1.9352e-01,  2.4126e-01],
        [-2.1987e-01,  3.0286e-01],
        [ 5.6544e-02,  2.9066e-02],
        [ 8.0666e-02,  3.6148e-02],
        [-2.4664e-04,  2.2563e-01],
        [ 5.8783e-02,  1.5717e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0376,  0.0529],
        [ 0.0427,  0.1352],
        [-0.1515,  0.1924],
        [ 0.0508,  0.2225],
        [ 0.2575,  0.0220],
        [ 0.2556,  0.0148],
        [ 0.2212,  0.1895],
        [ 0.1088,  0.0933],
        [ 0.1202,  0.0341],
        [ 0.1409,  0.2127],
        [ 0.0824,  0.2360],
        [ 0.1696,  0.1378]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.1383,  0.3128],
        [-0.2018,  0.1832],
        [-0.0453,  0.3348],
        [ 0.0574,  0.1605],
        [ 0.0777,  0.0633],
        [ 0.1376,  0.0198],
        [-0.0533,  0.1796],
        [-0.0375,  0.1106],
        [ 0.0941,  0.0610],
        [ 0.1408,  0.1698],
        [ 0.0219,  0.2681],
        [ 0.2210, -0.0343]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1702,  0.2085],
        [ 0.1051,  0.1309],
        [ 0.0474, -0.0915],
        [-0.2633,  0.3137],
        [ 0.0837,  0.2420],
        [ 0.3147, -0.1551],
        [-0.0047,  0.2620],
        [-0.0100,  0.1786],
        [ 0.1746,  0.0757],
        [-0.0440,  0.1331],
        [-0.2748,  0.3605],
        [-0.0944,  0.0378]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1061,  0.1661],
        [ 0.1659,  0.0212],
        [ 0.0235,  0.1274],
        [ 0.1718,  0.0774],
        [ 0.2643,  0.0420],
        [ 0.0742,  0.2360],
        [-0.0930,  0.3262],
        [ 0.1140,  0.1184],
        [-0.0405,  0.1428],
        [ 0.0425,  0.1513],
        [-0.0769,  0.2087],
        [ 0.0774,  0.2224]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.1353,  0.2476],
        [ 0.1794, -0.0731],
        [ 0.1275,  0.2140],
        [ 0.0499,  0.0486],
        [ 0.0524,  0.0863],
        [-0.0887,  0.2205],
        [-0.0607,  0.1536],
        [ 0.1198,  0.1061],
        [ 0.0289,  0.2220],
        [-0.0407,  0.1364],
        [ 0.1181,  0.0556],
        [ 0.2214, -0.0354]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0597,  0.1158],
        [ 0.0421,  0.2668],
        [-0.1611,  0.3712],
        [ 0.0691,  0.1350],
        [ 0.0511,  0.1447],
        [ 0.1649,  0.1491],
        [-0.1728,  0.4000],
        [ 0.0153,  0.1048],
        [ 0.0279,  0.3053],
        [ 0.1540,  0.1488],
        [-0.0932,  0.2797],
        [-0.0143,  0.1346]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0447,  0.2156],
        [-0.1755,  0.3030],
        [-0.0266,  0.1109],
        [-0.0059,  0.1015],
        [-0.1238,  0.2477],
        [-0.0177,  0.0694],
        [-0.1234,  0.1731],
        [ 0.2936, -0.0907],
        [ 0.1071,  0.1646],
        [-0.0716,  0.2267],
        [ 0.1030,  0.2169],
        [ 0.0291,  0.1901]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.2021, -0.0010],
        [ 0.1029,  0.2153],
        [ 0.1607,  0.0744],
        [ 0.0793,  0.1264],
        [ 0.0479,  0.1997],
        [ 0.1481, -0.0217],
        [ 0.1518,  0.1335],
        [-0.2017,  0.3183],
        [ 0.1181,  0.1560],
        [ 0.1027,  0.0870],
        [ 0.0756,  0.0976],
        [ 0.0727,  0.0358]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.1222,  0.2664],
        [-0.1086,  0.2576],
        [ 0.1787,  0.0866],
        [ 0.0148,  0.2679],
        [ 0.0922,  0.0187],
        [ 0.1601,  0.0856],
        [-0.0211,  0.2078],
        [ 0.0027,  0.1725],
        [ 0.0094,  0.1821],
        [ 0.1373,  0.0783],
        [-0.1168,  0.1266],
        [-0.1356,  0.3350]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0134,  0.0986],
        [-0.1050,  0.2940],
        [ 0.0294,  0.0472],
        [-0.0668,  0.2625],
        [-0.2243,  0.2675],
        [-0.0574,  0.2309],
        [-0.0951,  0.2247],
        [ 0.1113,  0.0564],
        [ 0.0545,  0.1432],
        [-0.1398,  0.4407],
        [-0.0472,  0.1693],
        [ 0.0475,  0.2896]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.1730,  0.1496],
        [ 0.1386,  0.0863],
        [ 0.1971,  0.1022],
        [-0.0051,  0.1276],
        [ 0.0784,  0.0150],
        [ 0.2202, -0.0611],
        [ 0.0807,  0.1788],
        [-0.0193,  0.2672],
        [-0.1531,  0.2136],
        [-0.0065,  0.2590],
        [ 0.1242,  0.0965],
        [ 0.1762,  0.1206]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.1823,  0.1186],
        [ 0.1092,  0.0320],
        [-0.0531,  0.3497],
        [-0.1863,  0.2522],
        [ 0.2634,  0.0016],
        [ 0.0098,  0.3202],
        [-0.2570,  0.2964],
        [ 0.0179,  0.1954],
        [ 0.0721,  0.0894],
        [-0.0674,  0.2027],
        [-0.1531,  0.3403],
        [ 0.0115,  0.2548]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0130,  0.1873],
        [-0.0140,  0.1948],
        [ 0.0120,  0.1474],
        [ 0.1662,  0.0265],
        [ 0.0185,  0.1158],
        [ 0.0676,  0.1401],
        [-0.0996,  0.1913],
        [-0.0867,  0.2142],
        [-0.0897,  0.1814],
        [ 0.2513, -0.0407],
        [-0.1253,  0.1950],
        [ 0.1623,  0.1652]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1008,  0.1849],
        [-0.0499,  0.1556],
        [ 0.2184,  0.0968],
        [-0.0452,  0.3278],
        [ 0.2988,  0.0264],
        [ 0.2407,  0.0353],
        [ 0.0344,  0.0531],
        [ 0.1497,  0.0463],
        [ 0.0046,  0.1008],
        [ 0.1364,  0.0353],
        [-0.0848,  0.2552],
        [-0.0101,  0.1226]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1482,  0.1202],
        [-0.0025,  0.2044],
        [ 0.0632,  0.2064],
        [-0.0078,  0.2721],
        [ 0.0672,  0.0972],
        [ 0.0281,  0.1770],
        [-0.1292,  0.1754],
        [-0.0730,  0.2367],
        [-0.0050,  0.2355],
        [ 0.0398,  0.1811],
        [-0.1738,  0.4610],
        [ 0.0354,  0.1063]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0428,  0.1424],
        [ 0.0186,  0.1412],
        [ 0.0035,  0.0241],
        [-0.0402,  0.1110],
        [ 0.0050,  0.1981],
        [-0.0484,  0.2331],
        [-0.0895,  0.2888],
        [ 0.0164,  0.2580],
        [ 0.0938,  0.1746],
        [ 0.0449,  0.1169],
        [ 0.0256,  0.2375],
        [ 0.0808,  0.0818]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1380,  0.2939],
        [ 0.0726,  0.1106],
        [ 0.0159,  0.2362],
        [ 0.0816,  0.2533],
        [-0.0112,  0.3267],
        [-0.0019,  0.1614],
        [-0.2365,  0.3337],
        [-0.1000,  0.2791],
        [ 0.0272,  0.3512],
        [-0.0446,  0.2739],
        [ 0.0022,  0.1438],
        [ 0.1315,  0.0845]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0786,  0.2748],
        [ 0.0941,  0.1731],
        [ 0.0513,  0.2474],
        [-0.0301,  0.1953],
        [ 0.1431,  0.2172],
        [ 0.0043,  0.2280],
        [-0.1002,  0.1990],
        [ 0.2239, -0.0086],
        [ 0.1497, -0.0320],
        [-0.0047,  0.2167],
        [ 0.1302,  0.0861],
        [ 0.1816,  0.1752]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0015,  0.1585],
        [ 0.0615,  0.1024],
        [ 0.0415,  0.2037],
        [-0.0123,  0.1388],
        [ 0.0959,  0.2538],
        [ 0.1260,  0.1924],
        [-0.0925,  0.2070],
        [-0.0072,  0.1154],
        [ 0.2062,  0.1450],
        [ 0.0958,  0.2513],
        [ 0.0203,  0.1279],
        [-0.1341,  0.2195]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.2212, -0.0051],
        [-0.0678,  0.1642],
        [ 0.1315,  0.1683],
        [-0.1609,  0.2425],
        [ 0.1626, -0.0545],
        [ 0.0379,  0.0523],
        [ 0.0236,  0.2547],
        [ 0.1509,  0.0745],
        [-0.0115,  0.2410],
        [ 0.1105,  0.0133],
        [ 0.0502,  0.1471],
        [-0.2521,  0.3849]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0770,  0.2212],
        [ 0.0686,  0.3043],
        [ 0.0703,  0.1377],
        [-0.0395,  0.2124],
        [-0.1103,  0.1935],
        [-0.1798,  0.2980],
        [-0.1613,  0.2312],
        [ 0.1633,  0.1123],
        [ 0.1834,  0.1015],
        [-0.0228,  0.2856],
        [-0.0678,  0.1854],
        [ 0.1398,  0.1043]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0322,  0.2350],
        [ 0.0840,  0.0919],
        [-0.2352,  0.3563],
        [ 0.1386,  0.0320],
        [-0.1624,  0.2334],
        [-0.0095,  0.0908],
        [-0.0487,  0.1118],
        [-0.0383,  0.1912],
        [-0.1518,  0.3258],
        [-0.0096,  0.1302],
        [ 0.0121,  0.1533],
        [ 0.2973, -0.0740]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.0322,  0.1631],
        [-0.1151,  0.2807],
        [-0.1731,  0.2497],
        [-0.0910,  0.2048],
        [ 0.4057, -0.1304],
        [ 0.0817,  0.0654],
        [-0.0104,  0.1943],
        [ 0.0689,  0.2183],
        [ 0.0317,  0.1575],
        [-0.0228,  0.2096],
        [ 0.0453,  0.1624],
        [ 0.0711,  0.2460]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0464,  0.2421],
        [-0.1090,  0.1932],
        [-0.0015,  0.1470],
        [ 0.0266,  0.1834],
        [-0.0223,  0.0316],
        [ 0.1281,  0.1479],
        [-0.1210,  0.3641],
        [ 0.0278,  0.2590],
        [-0.1307,  0.2948],
        [ 0.2538,  0.0160],
        [-0.0288,  0.1609],
        [ 0.1605,  0.0854]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.0925,  0.2991],
        [-0.0220,  0.1945],
        [ 0.0034,  0.1615],
        [-0.1419,  0.2920],
        [ 0.1295,  0.1582],
        [ 0.1315,  0.1310],
        [ 0.0642,  0.2308],
        [ 0.1100,  0.1979],
        [ 0.0340,  0.0751],
        [ 0.0593,  0.1888],
        [-0.1741,  0.3456],
        [ 0.0419,  0.2807]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1445,  0.0616],
        [-0.2128,  0.2683],
        [-0.0588,  0.3937],
        [-0.1899,  0.2614],
        [-0.0322,  0.1698],
        [-0.0410,  0.2418],
        [-0.1836,  0.1819],
        [ 0.1191,  0.0702],
        [-0.0724,  0.3193],
        [ 0.1371,  0.0673],
        [-0.1592,  0.3310],
        [-0.0828,  0.3416]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0508,  0.0722],
        [-0.0235,  0.2427],
        [ 0.1576,  0.0594],
        [ 0.1047,  0.0455],
        [ 0.1450,  0.2253],
        [-0.0733,  0.2213],
        [-0.0748,  0.2319],
        [ 0.1568,  0.1274],
        [ 0.0273,  0.2445],
        [-0.2256,  0.3362],
        [-0.0605,  0.2308],
        [ 0.0148,  0.1502]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0013,  0.0657],
        [ 0.1195,  0.0550],
        [ 0.0613,  0.0928],
        [ 0.1554,  0.0380],
        [ 0.0460,  0.1881],
        [-0.0056,  0.0253],
        [-0.1822,  0.2693],
        [ 0.0268,  0.2810],
        [ 0.0934,  0.1247],
        [-0.0074,  0.2331],
        [ 0.0538,  0.1732],
        [ 0.0024,  0.1092]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0130,  0.1734],
        [-0.0992,  0.2782],
        [ 0.0858,  0.0681],
        [ 0.0235,  0.1695],
        [ 0.0684,  0.1375],
        [ 0.1125,  0.0662],
        [-0.2517,  0.2505],
        [ 0.4494, -0.0234],
        [ 0.0859,  0.1296],
        [-0.1325,  0.2073],
        [ 0.0359,  0.1053],
        [ 0.1572,  0.0804]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.1143,  0.0283],
        [ 0.0236,  0.0084],
        [ 0.1229,  0.1252],
        [ 0.0112,  0.2135],
        [-0.0428,  0.2235],
        [ 0.0659,  0.1338],
        [-0.0334,  0.2587],
        [-0.0537,  0.1845],
        [ 0.1706,  0.2202],
        [ 0.0623,  0.0425],
        [-0.0537,  0.1590],
        [ 0.0244,  0.2048]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0035,  0.2690],
        [-0.2530,  0.1994],
        [ 0.0075,  0.1211],
        [-0.0026,  0.3148],
        [ 0.1701,  0.1339],
        [ 0.0007,  0.1959],
        [-0.0512,  0.1868],
        [-0.0316,  0.0786],
        [ 0.0957,  0.1336],
        [ 0.0029,  0.1467],
        [ 0.0204,  0.1994],
        [-0.1994,  0.2708]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0400,  0.2962],
        [-0.0556,  0.2859],
        [ 0.0195,  0.2572],
        [-0.0434,  0.2041],
        [-0.1063,  0.3904],
        [-0.0070,  0.2863],
        [-0.1113,  0.1923],
        [-0.0841,  0.1742],
        [-0.0356,  0.2859],
        [-0.1885,  0.3797],
        [-0.0666,  0.1738],
        [ 0.0111,  0.1248]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.2001,  0.3664],
        [ 0.1523,  0.1015],
        [ 0.1308, -0.0624],
        [ 0.0585,  0.0689],
        [-0.0881,  0.1661],
        [ 0.0636,  0.2619],
        [-0.0562,  0.1591],
        [-0.1530,  0.3502],
        [-0.0231,  0.1808],
        [-0.1313,  0.2723],
        [ 0.0580,  0.1947],
        [ 0.0177,  0.2256]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.0109,  0.1706],
        [-0.0253,  0.2339],
        [-0.2033,  0.2493],
        [-0.2496,  0.3665],
        [ 0.1025,  0.1139],
        [ 0.2373,  0.1314],
        [-0.0662,  0.2129],
        [ 0.0595,  0.2345],
        [ 0.0263,  0.1958],
        [-0.1067,  0.2862],
        [ 0.0203,  0.2171],
        [-0.0383,  0.2086]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.1081,  0.3301],
        [ 0.0182,  0.2056],
        [ 0.2267,  0.0758],
        [-0.0825,  0.1854],
        [-0.1684,  0.2011],
        [ 0.0741,  0.0777],
        [-0.1877,  0.3090],
        [-0.0928,  0.3078],
        [ 0.0714,  0.1361],
        [ 0.1522,  0.2914],
        [-0.1853,  0.2620],
        [ 0.1150,  0.0607]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.2158,  0.3341],
        [-0.0932,  0.2084],
        [ 0.1670,  0.0452],
        [-0.2532,  0.4038],
        [ 0.0651,  0.1558],
        [ 0.2527, -0.0841],
        [ 0.0605,  0.2094],
        [ 0.0089,  0.0977],
        [ 0.0303,  0.2434],
        [-0.0545,  0.1237],
        [-0.2295,  0.4028],
        [-0.0259,  0.1566]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.0871,  0.1775],
        [-0.0645,  0.3247],
        [-0.2000,  0.2962],
        [ 0.1689,  0.0775],
        [ 0.1630,  0.0703],
        [-0.1118,  0.2190],
        [-0.1666,  0.3106],
        [ 0.0904,  0.1011],
        [-0.0624,  0.3063],
        [ 0.1007,  0.1613],
        [-0.1008,  0.3984],
        [-0.1138,  0.1121]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 1.1193e-01,  3.7968e-02],
        [ 2.2283e-01, -3.2262e-04],
        [ 1.5096e-02,  1.3003e-01],
        [ 5.9033e-02,  1.8355e-02],
        [-7.8059e-02,  2.2360e-01],
        [-2.3928e-02,  2.9257e-01],
        [-1.4160e-01,  3.0212e-01],
        [ 1.6461e-01,  1.0569e-01],
        [-1.2312e-01,  3.9479e-01],
        [-2.1712e-03,  1.8309e-01],
        [-4.5715e-02,  2.1839e-01],
        [ 1.7632e-01,  5.7306e-02]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1913,  0.3139],
        [-0.0115,  0.2578],
        [-0.1492,  0.2040],
        [ 0.1830,  0.1021],
        [-0.0312,  0.1268],
        [ 0.1266,  0.0708],
        [-0.1870,  0.3273],
        [ 0.0635,  0.1520],
        [-0.1067,  0.3023],
        [ 0.0689,  0.1212],
        [-0.0159,  0.2832],
        [ 0.0373,  0.2255]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0674,  0.1172],
        [-0.1543,  0.2477],
        [ 0.0093,  0.2155],
        [-0.0535,  0.1768],
        [ 0.1065,  0.1874],
        [ 0.2271, -0.0208],
        [-0.1705,  0.3167],
        [ 0.1832, -0.0598],
        [-0.0532,  0.0926],
        [-0.0443,  0.2571],
        [ 0.1074,  0.1481],
        [ 0.0353,  0.1077]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0350,  0.2049],
        [-0.0102,  0.0493],
        [ 0.0487,  0.2012],
        [ 0.0089,  0.0809],
        [ 0.0576,  0.1414],
        [ 0.2367, -0.0506],
        [-0.0376,  0.0689],
        [-0.0715,  0.3570],
        [ 0.2058,  0.0468],
        [ 0.0597,  0.2265],
        [ 0.0940,  0.2761],
        [ 0.0803,  0.1376]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0406,  0.0235],
        [-0.0213,  0.1177],
        [-0.0121,  0.1842],
        [-0.0171,  0.2211],
        [ 0.0512,  0.0583],
        [ 0.0653,  0.2616],
        [-0.0314,  0.2514],
        [-0.0672,  0.1334],
        [-0.0898,  0.2510],
        [-0.0226,  0.2030],
        [ 0.0340,  0.2421],
        [-0.0802,  0.3092]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0871,  0.1079],
        [-0.0680,  0.1942],
        [-0.0234,  0.2882],
        [-0.0821,  0.2403],
        [-0.1699,  0.3035],
        [-0.0871,  0.2685],
        [-0.0341,  0.2711],
        [-0.0772,  0.3086],
        [ 0.0377,  0.2188],
        [-0.1292,  0.3360],
        [-0.1015,  0.2778],
        [ 0.0037,  0.2768]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0147,  0.2834],
        [ 0.2471, -0.1252],
        [ 0.0644,  0.1266],
        [ 0.1251,  0.0881],
        [-0.1132,  0.2436],
        [ 0.1127,  0.2438],
        [-0.0974,  0.2174],
        [-0.0622,  0.3230],
        [ 0.0305,  0.0766],
        [ 0.0248,  0.1309],
        [ 0.0876,  0.1980],
        [ 0.2226,  0.0287]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0214,  0.1834],
        [-0.1462,  0.3947],
        [-0.1501,  0.3414],
        [-0.2100,  0.3882],
        [ 0.1965, -0.0240],
        [ 0.1858, -0.0166],
        [-0.1758,  0.3210],
        [ 0.1010,  0.1121],
        [ 0.0220,  0.2743],
        [-0.0217,  0.3386],
        [ 0.1086,  0.0852],
        [ 0.1356,  0.2179]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0698,  0.1452],
        [-0.0531,  0.2471],
        [-0.1169,  0.2360],
        [ 0.0561,  0.1757],
        [-0.0553,  0.3413],
        [-0.0184,  0.2122],
        [-0.0592,  0.3276],
        [-0.1482,  0.3668],
        [-0.0807,  0.2840],
        [ 0.0272,  0.1633],
        [-0.1861,  0.2698],
        [ 0.0439,  0.0991]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1377,  0.2793],
        [-0.0480,  0.0673],
        [ 0.1255,  0.0859],
        [-0.2069,  0.3490],
        [ 0.0821,  0.1507],
        [ 0.3041, -0.0006],
        [ 0.0834,  0.1706],
        [ 0.1809,  0.0705],
        [ 0.1530,  0.1289],
        [ 0.0258,  0.1410],
        [-0.0979,  0.3973],
        [ 0.0087,  0.2525]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1306,  0.1640],
        [-0.0078,  0.2100],
        [-0.1867,  0.3036],
        [ 0.1401,  0.0232],
        [ 0.1160,  0.0775],
        [-0.1008,  0.3747],
        [-0.1444,  0.3144],
        [-0.0189,  0.2698],
        [-0.1786,  0.3501],
        [ 0.0399,  0.2161],
        [-0.1026,  0.4172],
        [ 0.0636,  0.1458]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0516,  0.1730],
        [ 0.0765,  0.0968],
        [ 0.0549,  0.1398],
        [-0.0778,  0.1502],
        [-0.0285,  0.1745],
        [-0.0956,  0.2963],
        [-0.0691,  0.3113],
        [ 0.0970,  0.1519],
        [ 0.0211,  0.3362],
        [-0.0192,  0.2705],
        [-0.0108,  0.1336],
        [ 0.1026,  0.1685]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1634,  0.2279],
        [-0.2468,  0.2727],
        [-0.1006,  0.3410],
        [-0.0341,  0.1719],
        [ 0.2054,  0.1279],
        [ 0.3109, -0.0413],
        [-0.0415,  0.3095],
        [-0.2528,  0.3492],
        [-0.1381,  0.2356],
        [ 0.0066,  0.1272],
        [-0.0811,  0.3384],
        [ 0.0510,  0.2283]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0519,  0.1638],
        [-0.0736,  0.3272],
        [-0.0542,  0.2669],
        [ 0.0444,  0.1810],
        [-0.0247,  0.2548],
        [ 0.1161,  0.0505],
        [-0.1118,  0.2991],
        [ 0.1772,  0.0721],
        [ 0.0602,  0.1583],
        [-0.0794,  0.2654],
        [-0.0703,  0.2316],
        [ 0.1544, -0.0357]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.1213,  0.0672],
        [-0.0538,  0.2637],
        [-0.0513,  0.2133],
        [-0.0591,  0.0905],
        [-0.1595,  0.3238],
        [ 0.0814,  0.0081],
        [-0.0543,  0.2655],
        [-0.1015,  0.2785],
        [-0.0648,  0.2590],
        [ 0.0751,  0.2932],
        [ 0.0861,  0.1077],
        [-0.0041,  0.1585]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0391,  0.0709],
        [ 0.1264,  0.0502],
        [ 0.0533,  0.1515],
        [ 0.0257,  0.2771],
        [ 0.1450, -0.0509],
        [ 0.1828,  0.0639],
        [-0.0081,  0.1085],
        [ 0.0175,  0.0978],
        [ 0.2108,  0.1053],
        [ 0.2477, -0.0117],
        [ 0.0865,  0.0269],
        [ 0.0787,  0.2045]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0025,  0.2010],
        [-0.0781,  0.2818],
        [ 0.0180,  0.2329],
        [ 0.0667,  0.2014],
        [-0.0211,  0.2860],
        [-0.0025,  0.3628],
        [ 0.0008,  0.2431],
        [-0.2215,  0.3453],
        [-0.0048,  0.1742],
        [-0.1272,  0.3517],
        [-0.1885,  0.2863],
        [-0.0428,  0.3146]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.0190,  0.3446],
        [ 0.1597,  0.1314],
        [ 0.0939,  0.2497],
        [ 0.1117,  0.1518],
        [-0.2195,  0.2461],
        [ 0.1460,  0.0394],
        [-0.0234,  0.2960],
        [ 0.0674,  0.0621],
        [ 0.0314,  0.1223],
        [ 0.1738,  0.1096],
        [ 0.1054,  0.2075],
        [ 0.2194, -0.0298]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0746,  0.1757],
        [-0.1153,  0.2129],
        [-0.1200,  0.2681],
        [ 0.0724,  0.1388],
        [ 0.2131,  0.0577],
        [ 0.2610,  0.0213],
        [-0.1428,  0.3067],
        [ 0.0062,  0.1720],
        [ 0.1508,  0.1489],
        [-0.0456,  0.2640],
        [ 0.0271,  0.1105],
        [ 0.0027,  0.2420]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0754,  0.2334],
        [ 0.1820,  0.0742],
        [ 0.0621,  0.1372],
        [-0.0992,  0.2384],
        [ 0.0251,  0.2101],
        [ 0.0942,  0.0313],
        [-0.0906,  0.2566],
        [-0.0641,  0.1561],
        [ 0.1717, -0.0085],
        [ 0.1908,  0.0613],
        [-0.0995,  0.2803],
        [ 0.1665,  0.1333]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1052,  0.3806],
        [ 0.0108,  0.2450],
        [ 0.0696,  0.0682],
        [-0.1912,  0.3879],
        [ 0.0849,  0.0578],
        [ 0.3402, -0.0498],
        [ 0.0717,  0.2724],
        [-0.0427,  0.1700],
        [ 0.1233,  0.0252],
        [-0.0037,  0.1963],
        [-0.1285,  0.2628],
        [ 0.0841,  0.0906]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1815,  0.1402],
        [ 0.2117, -0.0320],
        [ 0.0753,  0.2577],
        [ 0.2049,  0.0515],
        [ 0.2422,  0.1445],
        [ 0.0212,  0.1525],
        [-0.0945,  0.2138],
        [ 0.1906,  0.0993],
        [-0.0705,  0.1607],
        [ 0.2455, -0.0500],
        [ 0.1401,  0.1151],
        [ 0.0918,  0.2100]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.1253,  0.0324],
        [ 0.1910,  0.1448],
        [ 0.1872,  0.0685],
        [ 0.1492,  0.0627],
        [ 0.1578,  0.0678],
        [ 0.0135,  0.2094],
        [-0.0057,  0.2589],
        [ 0.1745,  0.1085],
        [ 0.1915,  0.1701],
        [ 0.3042,  0.0079],
        [-0.0574,  0.1412],
        [ 0.0274,  0.2087]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-1.0444e-01,  1.8906e-01],
        [ 1.0800e-01,  1.3671e-01],
        [-8.9049e-02,  3.1221e-01],
        [ 1.3171e-01,  1.1431e-01],
        [ 1.4396e-02,  3.1804e-01],
        [ 1.7262e-01,  2.6610e-02],
        [-1.8938e-01,  2.4644e-01],
        [ 1.0374e-01,  2.0895e-01],
        [-1.4511e-01,  3.5791e-01],
        [-2.5765e-04,  2.0545e-01],
        [-5.9462e-02,  2.1274e-01],
        [-7.8978e-02,  2.4045e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.1128,  0.0692],
        [-0.1434,  0.1837],
        [ 0.0560,  0.2238],
        [-0.0270,  0.3982],
        [-0.0104,  0.2166],
        [ 0.1557, -0.0348],
        [-0.0231,  0.1349],
        [ 0.3703, -0.0703],
        [ 0.0152,  0.1900],
        [ 0.0156,  0.2247],
        [ 0.0763,  0.3005],
        [ 0.0755,  0.1980]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0374,  0.1901],
        [ 0.1265, -0.1081],
        [-0.0936,  0.2287],
        [-0.0306,  0.1884],
        [ 0.0424,  0.1933],
        [ 0.2538,  0.1101],
        [ 0.1136,  0.1979],
        [-0.0638,  0.2744],
        [ 0.0084,  0.2400],
        [ 0.0116,  0.0247],
        [ 0.0296,  0.3242],
        [-0.0816,  0.1814]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0748,  0.2609],
        [-0.0736,  0.3003],
        [ 0.2274,  0.1555],
        [ 0.0395,  0.2586],
        [ 0.1552,  0.0680],
        [-0.0287,  0.0781],
        [-0.0291,  0.2044],
        [-0.0071,  0.2028],
        [ 0.0641,  0.1665],
        [ 0.0186,  0.0437],
        [ 0.0716,  0.1907],
        [-0.1643,  0.4129]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0399,  0.0803],
        [ 0.0434,  0.2284],
        [-0.0147,  0.2564],
        [-0.0363,  0.1894],
        [-0.0733,  0.3386],
        [ 0.0368,  0.3501],
        [-0.1269,  0.2142],
        [-0.0461,  0.1825],
        [ 0.1235,  0.2331],
        [-0.1212,  0.3512],
        [-0.0294,  0.2124],
        [ 0.1579,  0.0688]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0806,  0.2623],
        [ 0.0491,  0.0031],
        [ 0.0810,  0.0627],
        [ 0.1460,  0.1350],
        [-0.1743,  0.3243],
        [ 0.1035,  0.1663],
        [-0.0999,  0.2558],
        [-0.2363,  0.3023],
        [-0.0249,  0.3116],
        [ 0.0865,  0.1432],
        [ 0.0343,  0.1801],
        [ 0.0350,  0.2789]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0423,  0.0921],
        [-0.1590,  0.3982],
        [-0.1557,  0.3623],
        [ 0.0442,  0.2538],
        [ 0.2778,  0.0836],
        [ 0.2365, -0.0255],
        [-0.0668,  0.1742],
        [ 0.1120,  0.0960],
        [ 0.1708,  0.0988],
        [-0.1045,  0.3847],
        [ 0.0781,  0.1200],
        [ 0.0300,  0.2427]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0144,  0.2601],
        [ 0.1167,  0.0527],
        [-0.0817,  0.2163],
        [ 0.0191,  0.0223],
        [-0.0712,  0.2218],
        [ 0.0007,  0.1318],
        [-0.0946,  0.1944],
        [-0.1670,  0.3603],
        [ 0.0269,  0.1502],
        [ 0.3640, -0.1331],
        [-0.1248,  0.3062],
        [ 0.0305,  0.1989]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1203,  0.3068],
        [-0.0791,  0.1826],
        [ 0.0625,  0.0588],
        [-0.1047,  0.3689],
        [ 0.0696,  0.1606],
        [ 0.3831, -0.0333],
        [-0.0299,  0.3289],
        [-0.0493,  0.1814],
        [ 0.0553,  0.0717],
        [-0.0927,  0.1925],
        [-0.1762,  0.2274],
        [ 0.1047,  0.1441]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1329,  0.2098],
        [-0.0074,  0.1392],
        [-0.0610,  0.2933],
        [ 0.0144,  0.2155],
        [ 0.1247, -0.0412],
        [-0.1446,  0.3142],
        [-0.3001,  0.4339],
        [ 0.0962,  0.1085],
        [-0.0283,  0.2747],
        [-0.0170,  0.0662],
        [-0.0005,  0.2611],
        [ 0.0615,  0.1176]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0051,  0.2034],
        [ 0.1419,  0.1130],
        [ 0.0267,  0.2036],
        [ 0.0230,  0.1648],
        [ 0.0898,  0.2337],
        [-0.0551,  0.2787],
        [-0.1606,  0.2413],
        [ 0.0893,  0.1435],
        [ 0.0349,  0.2648],
        [ 0.2003, -0.1155],
        [ 0.0555,  0.2282],
        [ 0.2488,  0.1028]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1639,  0.2446],
        [-0.0240,  0.1424],
        [ 0.0910,  0.0583],
        [ 0.1846,  0.0564],
        [ 0.1550,  0.0432],
        [ 0.0353,  0.1951],
        [-0.2934,  0.2850],
        [-0.0279,  0.2155],
        [-0.0132,  0.2196],
        [-0.0132,  0.1978],
        [ 0.0716,  0.1230],
        [-0.1515,  0.2228]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0229,  0.2626],
        [-0.0791,  0.2039],
        [-0.0697,  0.3183],
        [-0.1048,  0.2561],
        [-0.0443,  0.2367],
        [ 0.0149,  0.2646],
        [-0.0096,  0.1742],
        [ 0.2345,  0.0873],
        [ 0.1765,  0.0968],
        [-0.1654,  0.4183],
        [-0.0430,  0.3483],
        [ 0.0968,  0.0825]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0659,  0.0769],
        [ 0.0044,  0.1320],
        [-0.0317,  0.2249],
        [ 0.0350,  0.0888],
        [ 0.0343,  0.1654],
        [ 0.0198,  0.2297],
        [ 0.1697,  0.0177],
        [-0.3743,  0.4536],
        [ 0.1797,  0.1234],
        [-0.0327,  0.1801],
        [ 0.1420,  0.0567],
        [-0.0664,  0.2221]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.1274,  0.3159],
        [ 0.0514,  0.1420],
        [-0.0977,  0.3849],
        [ 0.0523,  0.1777],
        [ 0.1513,  0.1393],
        [ 0.1465,  0.1535],
        [-0.0232,  0.3640],
        [-0.0264,  0.2264],
        [-0.1051,  0.2581],
        [ 0.1192,  0.1696],
        [ 0.0775,  0.1597],
        [-0.1539,  0.3414]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0941,  0.1737],
        [-0.0681,  0.2562],
        [-0.0604,  0.2842],
        [-0.0999,  0.1443],
        [-0.2433,  0.3371],
        [-0.0774,  0.2131],
        [-0.2510,  0.3305],
        [-0.0569,  0.2756],
        [-0.0522,  0.2820],
        [-0.1841,  0.3894],
        [-0.1106,  0.3033],
        [-0.0602,  0.1450]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1842,  0.3198],
        [ 0.0352,  0.1692],
        [ 0.0646,  0.2367],
        [ 0.0755,  0.0597],
        [-0.2928,  0.4978],
        [ 0.0669,  0.1889],
        [-0.2374,  0.3298],
        [-0.0652,  0.2758],
        [-0.2176,  0.3869],
        [ 0.0020,  0.1796],
        [-0.0670,  0.3276],
        [ 0.1481, -0.0318]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.0092,  0.2368],
        [-0.0397,  0.3477],
        [ 0.0131,  0.2345],
        [-0.2700,  0.2915],
        [ 0.2641,  0.0156],
        [ 0.0872,  0.1600],
        [ 0.0101,  0.1934],
        [ 0.1386,  0.0888],
        [ 0.0669,  0.1929],
        [-0.2422,  0.3207],
        [-0.0724,  0.2649],
        [-0.0144,  0.1944]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0287,  0.3147],
        [ 0.1408,  0.0170],
        [ 0.0161,  0.2404],
        [ 0.0391,  0.2006],
        [-0.0864,  0.2814],
        [ 0.1567, -0.0322],
        [-0.0544,  0.2644],
        [-0.0925,  0.2167],
        [-0.0662,  0.2266],
        [ 0.0239,  0.1565],
        [-0.1998,  0.5779],
        [ 0.0522,  0.1236]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.0143,  0.2530],
        [-0.0526,  0.1116],
        [ 0.0740,  0.0941],
        [-0.3086,  0.4414],
        [ 0.0226,  0.1992],
        [ 0.2221, -0.0399],
        [ 0.0911,  0.2221],
        [ 0.0844,  0.0205],
        [ 0.1861,  0.1333],
        [ 0.0068,  0.1694],
        [-0.1979,  0.3741],
        [ 0.0392,  0.0985]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.0984,  0.1301],
        [ 0.0454,  0.2021],
        [-0.0947,  0.2155],
        [-0.0288,  0.2314],
        [ 0.1525, -0.0415],
        [-0.0654,  0.3253],
        [-0.1968,  0.3255],
        [-0.0200,  0.2447],
        [-0.1979,  0.3053],
        [ 0.0942,  0.1789],
        [-0.1437,  0.3525],
        [-0.0021,  0.1794]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0818,  0.0784],
        [ 0.0496,  0.2702],
        [ 0.2923, -0.0460],
        [ 0.0477,  0.1674],
        [ 0.0858,  0.1504],
        [ 0.1203,  0.2125],
        [ 0.0033,  0.1067],
        [ 0.0075,  0.1327],
        [ 0.0335,  0.2161],
        [ 0.1581,  0.0956],
        [ 0.0460,  0.1928],
        [ 0.1250,  0.1348]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.2166,  0.3237],
        [ 0.0383,  0.1940],
        [-0.0337,  0.2441],
        [-0.0444,  0.0706],
        [ 0.0317,  0.1580],
        [ 0.1008,  0.0991],
        [-0.2776,  0.3852],
        [-0.1331,  0.3090],
        [-0.1045,  0.1912],
        [-0.0096,  0.2307],
        [-0.0842,  0.2862],
        [ 0.0799,  0.0826]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.1136,  0.1363],
        [-0.3120,  0.4027],
        [-0.1259,  0.3076],
        [-0.1739,  0.3459],
        [-0.0353,  0.2794],
        [ 0.1416,  0.0368],
        [-0.1722,  0.4051],
        [ 0.2044,  0.0253],
        [-0.0474,  0.1613],
        [-0.1641,  0.3871],
        [ 0.0205,  0.1509],
        [ 0.0982,  0.0523]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0165,  0.1486],
        [-0.0144,  0.1794],
        [ 0.0404,  0.2248],
        [-0.0671,  0.1961],
        [ 0.0032,  0.2488],
        [ 0.0139,  0.1288],
        [-0.0767,  0.1863],
        [-0.1303,  0.2718],
        [-0.0810,  0.2617],
        [ 0.1200,  0.0727],
        [ 0.0441,  0.1961],
        [-0.0736,  0.0282]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0348,  0.2474],
        [ 0.0053,  0.2584],
        [ 0.0296,  0.1545],
        [-0.0529,  0.1959],
        [-0.0719,  0.2944],
        [ 0.0759,  0.1195],
        [-0.0496,  0.2370],
        [ 0.0582, -0.0245],
        [-0.1040,  0.3511],
        [ 0.1290,  0.2036],
        [ 0.1315,  0.1345],
        [ 0.0368,  0.1927]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0120,  0.1360],
        [ 0.0028,  0.1871],
        [-0.1160,  0.4119],
        [-0.0608,  0.2802],
        [-0.0405,  0.2088],
        [ 0.0421,  0.2754],
        [-0.2952,  0.3073],
        [-0.2088,  0.3386],
        [-0.1526,  0.2690],
        [-0.1748,  0.3571],
        [-0.2279,  0.3811],
        [ 0.1168,  0.0733]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1508,  0.2861],
        [ 0.0160,  0.1864],
        [-0.0232,  0.2454],
        [-0.0954,  0.1752],
        [-0.3240,  0.4006],
        [-0.0576,  0.2359],
        [-0.1310,  0.2762],
        [-0.1163,  0.2843],
        [-0.1833,  0.2036],
        [-0.1924,  0.3377],
        [ 0.0749,  0.1540],
        [ 0.0153,  0.2836]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.3262,  0.2679],
        [-0.0748,  0.2195],
        [-0.3699,  0.4105],
        [-0.1906,  0.2516],
        [ 0.2661,  0.0270],
        [-0.0538,  0.2176],
        [-0.0997,  0.1951],
        [-0.0305,  0.1385],
        [-0.0388,  0.2544],
        [-0.2106,  0.4892],
        [-0.0296,  0.2604],
        [-0.1570,  0.2930]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0785,  0.2393],
        [-0.0539, -0.0223],
        [-0.0184,  0.2556],
        [ 0.0552,  0.1678],
        [-0.0428,  0.2395],
        [ 0.0636,  0.1349],
        [-0.2132,  0.1818],
        [-0.0662,  0.3299],
        [-0.1711,  0.3088],
        [ 0.1903,  0.0574],
        [-0.3369,  0.4210],
        [ 0.0475,  0.1681]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1710,  0.2379],
        [-0.0855,  0.1518],
        [ 0.1360,  0.0598],
        [-0.2952,  0.4019],
        [-0.0930,  0.2903],
        [ 0.2405,  0.0071],
        [ 0.0016,  0.1811],
        [-0.0179,  0.1764],
        [-0.0539,  0.3274],
        [ 0.1273,  0.1368],
        [-0.2549,  0.3532],
        [-0.0472,  0.2284]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.1669,  0.4204],
        [ 0.0093,  0.1291],
        [-0.2201,  0.2989],
        [-0.0920,  0.3106],
        [ 0.1487,  0.0152],
        [-0.1376,  0.2225],
        [-0.3033,  0.4132],
        [ 0.0143,  0.1156],
        [-0.2236,  0.3542],
        [-0.0326,  0.1834],
        [-0.1091,  0.2308],
        [ 0.0236,  0.2843]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0771,  0.0800],
        [ 0.0017,  0.2139],
        [ 0.1763,  0.0514],
        [-0.1751,  0.1491],
        [ 0.1710,  0.1135],
        [ 0.0149,  0.2058],
        [-0.0789,  0.3265],
        [-0.0212,  0.0835],
        [-0.0318,  0.0558],
        [ 0.1849,  0.1491],
        [-0.1035,  0.3054],
        [ 0.1217,  0.2143]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[ 0.0103,  0.0759],
        [-0.1388,  0.1198],
        [-0.0745,  0.2067],
        [ 0.0310,  0.1446],
        [-0.1981,  0.3259],
        [ 0.1069,  0.1055],
        [-0.2296,  0.4551],
        [-0.1142,  0.3314],
        [-0.1271,  0.2141],
        [ 0.0318,  0.2014],
        [-0.1477,  0.2423],
        [ 0.0088,  0.1416]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0837,  0.1075],
        [-0.1366,  0.1287],
        [-0.0770,  0.2515],
        [-0.1126,  0.1542],
        [ 0.0102,  0.3195],
        [ 0.2302,  0.0093],
        [-0.1106,  0.2316],
        [ 0.2388, -0.0134],
        [-0.0822,  0.1914],
        [-0.1106,  0.2707],
        [ 0.1499,  0.0791],
        [ 0.0951,  0.0989]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.1478,  0.0472],
        [ 0.0355,  0.1586],
        [ 0.0031,  0.2556],
        [ 0.0275,  0.1840],
        [-0.0960,  0.2851],
        [-0.0299,  0.1445],
        [ 0.1334,  0.1574],
        [ 0.0355,  0.2003],
        [-0.0290,  0.2724],
        [-0.1146,  0.2761],
        [ 0.0584,  0.0532],
        [ 0.0719,  0.1110]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0491,  0.1488],
        [-0.0430,  0.1101],
        [-0.1249,  0.1677],
        [ 0.0142,  0.1550],
        [ 0.1390,  0.1814],
        [ 0.1531,  0.0827],
        [-0.1623,  0.2428],
        [-0.0265,  0.2156],
        [-0.2106,  0.4009],
        [ 0.0370,  0.0832],
        [ 0.0220,  0.1491],
        [-0.2068,  0.3164]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.2387, -0.0125],
        [-0.0906,  0.2833],
        [ 0.0204,  0.2826],
        [-0.1449,  0.2416],
        [-0.1437,  0.2609],
        [-0.1054,  0.3969],
        [-0.1945,  0.2872],
        [-0.1099,  0.2750],
        [-0.0832,  0.2767],
        [-0.1760,  0.3048],
        [-0.0753,  0.4206],
        [ 0.2055,  0.1449]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1952,  0.3602],
        [ 0.0941, -0.0048],
        [-0.1008,  0.2169],
        [-0.1034,  0.2428],
        [-0.1712,  0.2868],
        [ 0.0702, -0.0087],
        [-0.2970,  0.5185],
        [-0.2348,  0.3093],
        [-0.1909,  0.4404],
        [-0.1101,  0.4251],
        [-0.1232,  0.2585],
        [ 0.1342,  0.1025]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.2134,  0.2811],
        [-0.0411,  0.2258],
        [-0.2323,  0.2956],
        [-0.1297,  0.2889],
        [ 0.3897, -0.1452],
        [ 0.0862,  0.0690],
        [-0.0783,  0.2187],
        [-0.0784,  0.2964],
        [ 0.0899,  0.1437],
        [ 0.0432,  0.2196],
        [ 0.2252,  0.1199],
        [ 0.0263,  0.2217]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.1507,  0.3127],
        [ 0.0016,  0.2760],
        [ 0.0149,  0.0986],
        [ 0.1612,  0.0627],
        [-0.0935,  0.1613],
        [ 0.1455,  0.0219],
        [-0.0979,  0.1587],
        [-0.0381,  0.1292],
        [ 0.0774,  0.0954],
        [ 0.3475, -0.1129],
        [ 0.0014,  0.1400],
        [ 0.0879,  0.1537]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.0593,  0.2258],
        [-0.2716,  0.2662],
        [ 0.0815,  0.1711],
        [-0.2492,  0.4103],
        [ 0.0275,  0.1495],
        [ 0.2218, -0.0413],
        [ 0.1404,  0.1481],
        [ 0.0095,  0.1481],
        [ 0.1087,  0.1213],
        [ 0.0630,  0.1080],
        [-0.1860,  0.3875],
        [-0.0852,  0.1681]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0856,  0.1735],
        [-0.0694,  0.2022],
        [-0.1476,  0.3021],
        [-0.0786,  0.1832],
        [ 0.1900, -0.0100],
        [-0.1239,  0.2757],
        [-0.2479,  0.3873],
        [-0.2721,  0.5048],
        [-0.1233,  0.3109],
        [ 0.1648,  0.0198],
        [-0.2106,  0.2869],
        [-0.1570,  0.1523]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0761,  0.2039],
        [-0.1318,  0.2694],
        [-0.1194,  0.2294],
        [-0.1833,  0.2427],
        [-0.1220,  0.3141],
        [ 0.0640,  0.1447],
        [-0.2559,  0.2817],
        [-0.1405,  0.2212],
        [-0.1417,  0.2297],
        [-0.0038,  0.2866],
        [ 0.0297,  0.2070],
        [ 0.0076,  0.3239]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.2659,  0.3662],
        [-0.1582,  0.2308],
        [-0.0946,  0.3457],
        [ 0.0432,  0.0120],
        [ 0.1604,  0.0904],
        [-0.0256,  0.2081],
        [-0.2824,  0.3627],
        [-0.1816,  0.2870],
        [-0.0467,  0.2065],
        [-0.2443,  0.4559],
        [-0.3348,  0.4553],
        [ 0.0495,  0.2380]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.1657,  0.2141],
        [-0.3694,  0.4292],
        [-0.0541,  0.4322],
        [-0.2519,  0.3077],
        [-0.0206,  0.2618],
        [-0.1042,  0.2001],
        [-0.2915,  0.4742],
        [ 0.2458,  0.1561],
        [ 0.0416,  0.1501],
        [-0.3332,  0.3159],
        [-0.0673,  0.3219],
        [-0.0285,  0.2092]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.1328,  0.2264],
        [ 0.0037,  0.0738],
        [-0.1343,  0.4181],
        [-0.2207,  0.3117],
        [-0.0762,  0.2771],
        [ 0.1874,  0.1113],
        [-0.1122,  0.3323],
        [-0.2843,  0.3649],
        [-0.2382,  0.4287],
        [-0.1472,  0.3487],
        [-0.1523,  0.3509],
        [-0.2258,  0.3343]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.1244,  0.0205],
        [ 0.0320,  0.1369],
        [-0.2756,  0.3201],
        [ 0.0762,  0.1490],
        [-0.1572,  0.2352],
        [ 0.0929, -0.0479],
        [ 0.1919,  0.0167],
        [-0.0349,  0.1605],
        [ 0.0797,  0.2390],
        [ 0.1097,  0.0087],
        [ 0.2109,  0.0586],
        [-0.0673,  0.1442]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0416,  0.0593],
        [ 0.1103,  0.0170],
        [-0.0514,  0.1583],
        [-0.0190,  0.1208],
        [-0.1618,  0.3596],
        [-0.1645,  0.2991],
        [-0.0533,  0.1591],
        [ 0.0591,  0.1878],
        [-0.0974,  0.1105],
        [ 0.1088,  0.1735],
        [-0.1247,  0.1991],
        [ 0.0813,  0.2420]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0199,  0.1528],
        [ 0.1080,  0.0516],
        [ 0.3794, -0.0814],
        [ 0.1872, -0.1041],
        [-0.2942,  0.3383],
        [ 0.2670, -0.0760],
        [-0.0584,  0.2334],
        [-0.2147,  0.2885],
        [-0.0290,  0.2183],
        [ 0.0573,  0.1264],
        [ 0.2013,  0.0413],
        [ 0.2187, -0.1164]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0761,  0.0708],
        [ 0.0259,  0.1819],
        [-0.1373,  0.2339],
        [-0.0875,  0.3801],
        [ 0.2812, -0.1152],
        [ 0.0246,  0.1235],
        [-0.0694,  0.1115],
        [ 0.1944,  0.0631],
        [ 0.1535,  0.1528],
        [-0.0154,  0.3327],
        [-0.0330,  0.2574],
        [-0.0286,  0.1645]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0644,  0.2440],
        [ 0.0985,  0.0588],
        [-0.0682,  0.2138],
        [-0.1631,  0.2719],
        [-0.1525,  0.1688],
        [ 0.0948,  0.0196],
        [-0.0968,  0.1482],
        [-0.0853,  0.1800],
        [ 0.0719,  0.0289],
        [ 0.1788,  0.0491],
        [-0.1335,  0.3288],
        [ 0.0556,  0.0091]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.2168,  0.2966],
        [-0.0350,  0.2772],
        [-0.0063,  0.2101],
        [-0.2431,  0.2807],
        [ 0.0845, -0.0040],
        [ 0.2493, -0.0610],
        [ 0.1112,  0.1315],
        [-0.0137,  0.0380],
        [ 0.0577,  0.2072],
        [ 0.0403,  0.1103],
        [-0.1601,  0.2565],
        [-0.0323,  0.4041]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.2589,  0.4647],
        [-0.2795,  0.3145],
        [-0.2955,  0.3584],
        [-0.3016,  0.4648],
        [ 0.0631,  0.1838],
        [-0.3048,  0.4792],
        [-0.5343,  0.6040],
        [-0.3417,  0.4746],
        [-0.2945,  0.4355],
        [-0.0577,  0.2212],
        [-0.1912,  0.2584],
        [-0.2363,  0.3662]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0256,  0.2108],
        [-0.1164,  0.3989],
        [ 0.1021,  0.0121],
        [-0.0521,  0.1903],
        [ 0.0779,  0.2901],
        [-0.2822,  0.4521],
        [-0.3214,  0.4002],
        [-0.1967,  0.2960],
        [-0.0719,  0.2869],
        [ 0.1175,  0.0852],
        [-0.1913,  0.2772],
        [-0.1783,  0.3491]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1098,  0.2060],
        [-0.1158,  0.2039],
        [-0.1594,  0.2250],
        [-0.0468,  0.2901],
        [ 0.0924,  0.1228],
        [ 0.0581,  0.1547],
        [-0.3453,  0.4172],
        [-0.0971,  0.3496],
        [ 0.0823,  0.1160],
        [-0.0147,  0.2530],
        [-0.1751,  0.3103],
        [-0.1075,  0.2446]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0244,  0.1703],
        [-0.3233,  0.4163],
        [ 0.0591,  0.1111],
        [-0.1000,  0.3405],
        [-0.0564,  0.2704],
        [-0.0148,  0.0947],
        [-0.1882,  0.2572],
        [ 0.2554, -0.0877],
        [-0.1287,  0.1645],
        [-0.1652,  0.3283],
        [-0.0812,  0.2409],
        [ 0.0354,  0.1775]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0838,  0.1722],
        [-0.0507,  0.1198],
        [-0.3144,  0.3603],
        [-0.1235,  0.2191],
        [ 0.0460,  0.0972],
        [ 0.1781, -0.0206],
        [-0.1621,  0.1660],
        [-0.2391,  0.2495],
        [-0.0419,  0.2175],
        [-0.0374,  0.1656],
        [ 0.0755,  0.1829],
        [-0.2496,  0.3324]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0030,  0.1388],
        [-0.1598,  0.2604],
        [ 0.0339,  0.0483],
        [-0.2276,  0.2641],
        [-0.0846,  0.2412],
        [ 0.0544,  0.0701],
        [-0.0692,  0.1729],
        [-0.0744,  0.1064],
        [ 0.1203,  0.1149],
        [-0.1013,  0.1673],
        [-0.0816,  0.2952],
        [-0.1946,  0.3703]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0669,  0.1183],
        [-0.2181,  0.3295],
        [ 0.0166,  0.2252],
        [-0.2362,  0.2969],
        [-0.2023,  0.4127],
        [-0.2422,  0.2560],
        [-0.3493,  0.4152],
        [-0.0738,  0.2090],
        [-0.0222,  0.2709],
        [-0.2000,  0.3336],
        [-0.2388,  0.3798],
        [-0.0117,  0.2814]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0692,  0.2394],
        [-0.0962,  0.1633],
        [-0.0131,  0.2096],
        [-0.0864,  0.1751],
        [-0.2372,  0.3583],
        [-0.1401,  0.2190],
        [-0.1875,  0.3172],
        [-0.3331,  0.3952],
        [-0.1173,  0.3016],
        [-0.0542,  0.1332],
        [-0.0602,  0.3179],
        [-0.0771,  0.1004]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0023,  0.2087],
        [-0.4328,  0.5138],
        [-0.2368,  0.2955],
        [-0.1891,  0.2742],
        [ 0.1745,  0.1317],
        [ 0.0153,  0.1662],
        [-0.1632,  0.4658],
        [-0.1071,  0.3388],
        [-0.0717,  0.2180],
        [-0.2016,  0.3332],
        [-0.1712,  0.2724],
        [-0.2385,  0.3611]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-2.2992e-01,  2.1193e-01],
        [-1.1249e-01,  3.3852e-01],
        [-1.6576e-01,  2.8177e-01],
        [ 1.0134e-02,  9.2525e-02],
        [-2.0294e-01,  4.2814e-01],
        [ 1.5628e-02,  2.0882e-02],
        [-1.4551e-01,  3.9104e-01],
        [-2.5963e-01,  3.0703e-01],
        [-1.3728e-01,  3.4041e-01],
        [ 3.4114e-04,  1.8794e-01],
        [-2.1650e-01,  3.4077e-01],
        [ 3.8385e-02,  1.4963e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.3039,  0.3805],
        [-0.1815,  0.2687],
        [ 0.1576, -0.0104],
        [-0.2796,  0.4473],
        [ 0.1688, -0.0173],
        [ 0.3855, -0.0912],
        [-0.0187,  0.2947],
        [-0.1964,  0.1587],
        [ 0.0600,  0.0455],
        [-0.0951,  0.1475],
        [-0.2857,  0.3571],
        [-0.0724,  0.1275]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0622,  0.3854],
        [-0.0515,  0.0649],
        [-0.1250,  0.2328],
        [-0.2086,  0.2417],
        [ 0.1471,  0.0294],
        [-0.2803,  0.3413],
        [-0.3413,  0.3937],
        [-0.1511,  0.2416],
        [ 0.0070,  0.1763],
        [ 0.0905,  0.0558],
        [-0.1285,  0.2551],
        [-0.1442,  0.2454]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0883,  0.2082],
        [ 0.0339,  0.1341],
        [ 0.0481,  0.0230],
        [ 0.0758,  0.1145],
        [-0.0155,  0.1712],
        [-0.0993,  0.2963],
        [-0.1852,  0.2842],
        [-0.1700,  0.2722],
        [-0.0618,  0.2327],
        [-0.1849,  0.2768],
        [-0.1498,  0.2195],
        [-0.0410,  0.2030]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1128,  0.1960],
        [-0.2027,  0.2771],
        [-0.2635,  0.3140],
        [ 0.0771,  0.0243],
        [ 0.0441,  0.1686],
        [-0.1614,  0.3635],
        [-0.3310,  0.5357],
        [-0.2248,  0.4196],
        [-0.2443,  0.3862],
        [-0.0496,  0.1146],
        [-0.2237,  0.3866],
        [-0.0572,  0.1791]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0812,  0.2247],
        [-0.0252,  0.1896],
        [-0.1629,  0.3143],
        [-0.1576,  0.1913],
        [-0.1493,  0.2395],
        [-0.0708,  0.2503],
        [-0.3547,  0.4963],
        [ 0.2509, -0.0325],
        [-0.0523,  0.1969],
        [-0.2406,  0.4509],
        [-0.0568,  0.2453],
        [-0.0217,  0.2331]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.1566,  0.1009],
        [ 0.1584, -0.0009],
        [ 0.0371,  0.1152],
        [-0.0642,  0.1835],
        [ 0.0773,  0.1527],
        [-0.0817,  0.2089],
        [ 0.0601,  0.1341],
        [-0.0549,  0.1778],
        [ 0.0313,  0.2582],
        [ 0.1116,  0.1237],
        [-0.0426,  0.1762],
        [-0.1395,  0.2739]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.0628,  0.1612],
        [-0.2337,  0.2129],
        [-0.0672,  0.3202],
        [-0.0270,  0.2205],
        [ 0.0537,  0.1700],
        [ 0.0694, -0.0207],
        [-0.1874,  0.3527],
        [ 0.0409,  0.2159],
        [ 0.0811,  0.1771],
        [-0.0107,  0.0953],
        [-0.0581,  0.2737],
        [-0.1860,  0.3647]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0236,  0.0942],
        [-0.1871,  0.3335],
        [ 0.0565,  0.1488],
        [-0.1303,  0.2264],
        [-0.0841,  0.2099],
        [-0.0251,  0.2961],
        [-0.1766,  0.3058],
        [-0.1139,  0.1127],
        [-0.1537,  0.3068],
        [-0.1821,  0.3602],
        [-0.0364,  0.2056],
        [ 0.1477,  0.1541]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1547,  0.3495],
        [ 0.0462,  0.1138],
        [-0.0177,  0.1682],
        [-0.1817,  0.1854],
        [-0.3456,  0.3714],
        [-0.1329,  0.2450],
        [-0.2049,  0.2897],
        [-0.3036,  0.3424],
        [-0.2084,  0.4404],
        [-0.1203,  0.2421],
        [ 0.0990,  0.1739],
        [ 0.1446,  0.0357]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-9.4450e-02,  1.5767e-01],
        [-1.8124e-01,  2.8592e-01],
        [-3.1793e-01,  4.3863e-01],
        [-1.2080e-01,  2.9687e-01],
        [ 1.4543e-01,  4.2521e-04],
        [ 1.8376e-02,  5.4637e-02],
        [-9.3854e-02,  2.8872e-01],
        [ 3.0945e-02,  1.8411e-01],
        [ 1.5255e-01,  8.8869e-02],
        [-2.4770e-01,  4.1954e-01],
        [-5.5774e-02,  2.2301e-01],
        [-1.5709e-01,  4.5495e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2554,  0.3389],
        [ 0.0751,  0.0409],
        [-0.0596,  0.1982],
        [ 0.1303,  0.0038],
        [-0.1419,  0.3126],
        [ 0.0940,  0.1597],
        [-0.1986,  0.2620],
        [-0.1707,  0.1461],
        [-0.0334,  0.2482],
        [ 0.2184,  0.0669],
        [-0.2267,  0.1625],
        [ 0.0815,  0.1093]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.0474,  0.2729],
        [-0.1444,  0.2512],
        [ 0.1237,  0.1642],
        [ 0.0230,  0.3021],
        [-0.0317,  0.2089],
        [ 0.1938, -0.1364],
        [ 0.2237,  0.1113],
        [-0.2283,  0.3506],
        [ 0.0187,  0.1141],
        [-0.1220,  0.2635],
        [-0.1724,  0.3286],
        [-0.0813,  0.2768]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.2556,  0.4972],
        [ 0.0627,  0.1428],
        [-0.0641,  0.2944],
        [ 0.0199,  0.1348],
        [ 0.0921,  0.0983],
        [-0.0571,  0.2769],
        [-0.5146,  0.5066],
        [ 0.0044,  0.1271],
        [-0.2999,  0.4342],
        [-0.0632,  0.2006],
        [-0.2534,  0.4474],
        [ 0.0634,  0.1632]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0117,  0.1525],
        [-0.0006,  0.2990],
        [-0.0228,  0.1503],
        [-0.1036,  0.2265],
        [-0.0394,  0.2740],
        [-0.0964,  0.2811],
        [-0.1746,  0.2862],
        [-0.1520,  0.4198],
        [ 0.0872,  0.0784],
        [ 0.1061,  0.0134],
        [-0.0454,  0.2005],
        [ 0.2186,  0.2139]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1960,  0.2347],
        [-0.0561,  0.2910],
        [-0.1182,  0.2320],
        [-0.0237,  0.2322],
        [ 0.0807,  0.1242],
        [ 0.0266,  0.1228],
        [-0.4036,  0.5001],
        [-0.1227,  0.1571],
        [-0.0403,  0.2193],
        [-0.1355,  0.2782],
        [-0.2925,  0.4639],
        [-0.1094,  0.3077]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.0132,  0.1865],
        [-0.1962,  0.3294],
        [-0.0314,  0.1782],
        [-0.0796,  0.3342],
        [-0.0789,  0.1412],
        [ 0.0765,  0.1553],
        [-0.2028,  0.3965],
        [ 0.2760, -0.0232],
        [ 0.2624, -0.0340],
        [-0.0403,  0.2624],
        [-0.0725,  0.1513],
        [ 0.0706, -0.0260]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0088,  0.2071],
        [-0.0818,  0.0875],
        [-0.1424,  0.2208],
        [-0.1818,  0.3708],
        [-0.0502,  0.3049],
        [-0.0419,  0.1655],
        [ 0.0863,  0.0473],
        [-0.2915,  0.2799],
        [-0.0693,  0.3357],
        [-0.2572,  0.3721],
        [-0.0543,  0.3106],
        [-0.2390,  0.3320]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.1238,  0.2541],
        [-0.0660,  0.2507],
        [ 0.0424,  0.3207],
        [-0.2828,  0.3547],
        [-0.1194,  0.3322],
        [-0.0385,  0.1467],
        [-0.0191,  0.3365],
        [-0.2053,  0.2975],
        [-0.1213,  0.2610],
        [ 0.0832,  0.1060],
        [ 0.0191,  0.1394],
        [-0.2821,  0.4281]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0371,  0.1793],
        [-0.1687,  0.2035],
        [-0.1294,  0.4494],
        [-0.2256,  0.3801],
        [-0.2851,  0.3334],
        [-0.0957,  0.3503],
        [-0.2053,  0.3040],
        [-0.2015,  0.2765],
        [-0.0319,  0.2148],
        [-0.0883,  0.2845],
        [-0.1063,  0.2129],
        [ 0.1291,  0.1230]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1616,  0.3102],
        [ 0.0280,  0.1612],
        [ 0.0564,  0.1942],
        [ 0.0101,  0.1784],
        [-0.2641,  0.3649],
        [ 0.1101, -0.0627],
        [-0.1110,  0.2424],
        [-0.1629,  0.3265],
        [-0.1608,  0.2473],
        [ 0.0161,  0.1694],
        [ 0.0202,  0.1534],
        [ 0.0212,  0.1636]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.1009,  0.2311],
        [-0.2144,  0.3858],
        [-0.2426,  0.4317],
        [-0.1690,  0.2995],
        [ 0.2334, -0.0648],
        [-0.1581,  0.3174],
        [-0.0994,  0.3533],
        [-0.0477,  0.3484],
        [ 0.1450,  0.1334],
        [-0.2737,  0.3693],
        [-0.1942,  0.3663],
        [-0.0304,  0.3966]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.0462,  0.2997],
        [ 0.0460,  0.1929],
        [-0.1016,  0.2650],
        [ 0.1162,  0.0942],
        [-0.0497,  0.2820],
        [ 0.0486,  0.1346],
        [-0.0627,  0.1989],
        [-0.2682,  0.3804],
        [-0.1387,  0.2722],
        [ 0.2431, -0.0934],
        [-0.1776,  0.3180],
        [-0.1377,  0.2538]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1425,  0.2963],
        [-0.3912,  0.4202],
        [-0.0037,  0.1463],
        [-0.4273,  0.4829],
        [ 0.0593,  0.2107],
        [ 0.3777, -0.0147],
        [-0.2057,  0.2873],
        [-0.2088,  0.3707],
        [-0.2201,  0.2861],
        [-0.0631,  0.1528],
        [-0.2655,  0.3466],
        [-0.1903,  0.4306]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0252,  0.2633],
        [-0.2195,  0.3499],
        [-0.0511,  0.2013],
        [-0.1051,  0.2311],
        [-0.1229,  0.2007],
        [-0.2384,  0.3707],
        [-0.4171,  0.4918],
        [-0.2926,  0.4039],
        [-0.2285,  0.3049],
        [-0.0818,  0.1422],
        [-0.2245,  0.3281],
        [-0.1441,  0.1977]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0565,  0.2502],
        [-0.0904,  0.2988],
        [-0.0441,  0.2014],
        [ 0.0045,  0.1761],
        [-0.2292,  0.3830],
        [-0.1480,  0.3737],
        [-0.2311,  0.3216],
        [-0.3365,  0.5344],
        [-0.2354,  0.3785],
        [ 0.0934,  0.0067],
        [-0.1471,  0.3328],
        [ 0.0546,  0.0959]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0182,  0.2262],
        [-0.1561,  0.2815],
        [-0.1506,  0.3340],
        [ 0.1498,  0.1397],
        [ 0.0359,  0.1691],
        [-0.0990,  0.3024],
        [-0.5341,  0.5386],
        [-0.1122,  0.3384],
        [-0.1615,  0.2399],
        [-0.0548,  0.3119],
        [-0.0548,  0.2531],
        [-0.0994,  0.3180]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.2288,  0.3207],
        [-0.0766,  0.3086],
        [-0.2010,  0.4467],
        [-0.1669,  0.2563],
        [-0.0321,  0.1967],
        [ 0.0393,  0.2289],
        [-0.2314,  0.3865],
        [-0.0155,  0.1570],
        [ 0.1068,  0.1458],
        [-0.2370,  0.5028],
        [ 0.0363,  0.2048],
        [-0.0554,  0.3206]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.1612,  0.2947],
        [-0.0222,  0.2555],
        [ 0.0109,  0.2900],
        [-0.0317,  0.1553],
        [-0.1096,  0.3315],
        [ 0.0502,  0.2548],
        [-0.3900,  0.5204],
        [-0.2672,  0.3948],
        [-0.2797,  0.3881],
        [-0.0406,  0.2746],
        [-0.0739,  0.2603],
        [-0.2659,  0.4274]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0050,  0.2691],
        [-0.1621,  0.3405],
        [-0.0279,  0.3009],
        [-0.1706,  0.2706],
        [-0.1210,  0.2416],
        [ 0.0643,  0.1647],
        [-0.0227,  0.2130],
        [-0.1131,  0.2402],
        [-0.2782,  0.3331],
        [-0.1490,  0.3634],
        [-0.1316,  0.4250],
        [-0.1968,  0.4055]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0640,  0.2279],
        [-0.1602,  0.3448],
        [-0.2688,  0.4199],
        [-0.1812,  0.4039],
        [-0.3299,  0.4113],
        [-0.0510,  0.1521],
        [-0.3322,  0.4038],
        [-0.2125,  0.4515],
        [-0.0903,  0.2505],
        [-0.1233,  0.3703],
        [-0.1287,  0.3060],
        [ 0.0624,  0.1865]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1605,  0.3950],
        [ 0.0160,  0.2024],
        [ 0.2822, -0.0185],
        [-0.2098,  0.4075],
        [-0.2207,  0.3846],
        [-0.1502,  0.3187],
        [-0.3250,  0.4708],
        [-0.4629,  0.5842],
        [-0.2215,  0.4455],
        [ 0.1701,  0.1223],
        [-0.0520,  0.1804],
        [-0.0347,  0.2490]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.0998,  0.2089],
        [-0.2067,  0.4576],
        [-0.3343,  0.5079],
        [ 0.0049,  0.2153],
        [ 0.1015,  0.0651],
        [-0.1860,  0.3000],
        [-0.1770,  0.4428],
        [ 0.1385,  0.0984],
        [-0.0048,  0.1574],
        [-0.1401,  0.3676],
        [-0.1661,  0.4196],
        [-0.2804,  0.5939]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2842,  0.3141],
        [-0.2292,  0.3767],
        [-0.1413,  0.1941],
        [-0.0748,  0.1619],
        [-0.1612,  0.3500],
        [-0.0161,  0.2629],
        [-0.1828,  0.3129],
        [-0.2982,  0.5110],
        [-0.1619,  0.2542],
        [ 0.1505,  0.1337],
        [-0.3923,  0.5281],
        [-0.0265,  0.0890]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.5454,  0.7072],
        [-0.1306,  0.3068],
        [-0.0943,  0.2140],
        [-0.4263,  0.5497],
        [-0.0224,  0.2667],
        [-0.0171,  0.1698],
        [-0.2350,  0.4653],
        [-0.0352,  0.3090],
        [-0.0504,  0.3434],
        [-0.0672,  0.0803],
        [-0.3747,  0.5075],
        [-0.2556,  0.3374]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.1739,  0.3982],
        [ 0.0431,  0.2563],
        [-0.2537,  0.3515],
        [-0.1281,  0.2179],
        [-0.1244,  0.3581],
        [-0.2125,  0.3740],
        [-0.3479,  0.5519],
        [-0.2977,  0.3858],
        [-0.2858,  0.2604],
        [-0.1459,  0.3001],
        [-0.2214,  0.3568],
        [-0.2295,  0.4635]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0527,  0.1588],
        [-0.3724,  0.5218],
        [-0.0630,  0.1981],
        [ 0.0105,  0.1580],
        [ 0.0073,  0.2400],
        [-0.1710,  0.4922],
        [-0.2513,  0.4529],
        [-0.2783,  0.4360],
        [-0.1579,  0.3710],
        [-0.0542,  0.2192],
        [-0.1967,  0.3617],
        [-0.1032,  0.3135]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0707,  0.0866],
        [-0.3389,  0.4641],
        [-0.1134,  0.1844],
        [-0.2161,  0.3150],
        [-0.3031,  0.2532],
        [ 0.0017,  0.1741],
        [-0.4674,  0.6570],
        [-0.1419,  0.3870],
        [-0.2802,  0.3701],
        [-0.0227,  0.2727],
        [-0.1698,  0.3011],
        [-0.0175,  0.1754]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.2082,  0.4106],
        [-0.1813,  0.3613],
        [-0.1819,  0.3750],
        [-0.1952,  0.3437],
        [-0.0250,  0.2837],
        [-0.0189,  0.1243],
        [-0.2334,  0.4680],
        [ 0.0423,  0.0968],
        [-0.0281,  0.2875],
        [-0.2502,  0.4021],
        [-0.2191,  0.4355],
        [ 0.1753,  0.1469]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.2496,  0.3406],
        [-0.1221,  0.3793],
        [ 0.1414,  0.1180],
        [-0.0594,  0.1916],
        [-0.1132,  0.3054],
        [ 0.0071,  0.1792],
        [-0.1755,  0.4203],
        [-0.3367,  0.3980],
        [-0.3088,  0.4130],
        [-0.1805,  0.3368],
        [-0.0974,  0.2963],
        [-0.4020,  0.4711]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0994,  0.3626],
        [-0.1162,  0.2591],
        [-0.1004,  0.4524],
        [-0.1485,  0.2105],
        [ 0.2017,  0.0279],
        [ 0.0674,  0.1271],
        [-0.0974,  0.2729],
        [ 0.0099,  0.1011],
        [-0.1112,  0.3268],
        [ 0.0235,  0.0939],
        [-0.4019,  0.4968],
        [-0.2966,  0.4067]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.1774,  0.3366],
        [-0.1911,  0.2955],
        [-0.3716,  0.4545],
        [-0.2186,  0.3736],
        [-0.4208,  0.4233],
        [-0.0923,  0.3559],
        [-0.3279,  0.6293],
        [-0.2487,  0.3918],
        [-0.2661,  0.4051],
        [-0.5000,  0.5510],
        [-0.3894,  0.5567],
        [-0.0423,  0.2399]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-1.6453e-01,  3.3222e-01],
        [ 2.9971e-02,  1.3137e-01],
        [ 1.0026e-01,  1.1925e-01],
        [-2.4384e-01,  4.8862e-01],
        [-3.9590e-01,  5.0716e-01],
        [ 3.9649e-04,  1.6764e-01],
        [-2.3825e-01,  3.9736e-01],
        [-2.4540e-01,  2.9353e-01],
        [-5.2113e-01,  5.8886e-01],
        [-4.5361e-02,  1.8791e-01],
        [-1.2775e-01,  2.5346e-01],
        [ 9.0643e-02,  1.4702e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.0739,  0.2945],
        [-0.0764,  0.2244],
        [-0.4361,  0.4945],
        [-0.1775,  0.3148],
        [ 0.0502,  0.1669],
        [ 0.1071,  0.0315],
        [-0.2134,  0.3519],
        [ 0.0335,  0.1636],
        [-0.0315,  0.3106],
        [-0.2454,  0.4427],
        [-0.2726,  0.3209],
        [-0.0885,  0.3717]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2029,  0.4286],
        [-0.0406,  0.1315],
        [ 0.0490,  0.1608],
        [-0.0122,  0.2891],
        [-0.2309,  0.2690],
        [-0.1167,  0.2196],
        [-0.2693,  0.4759],
        [-0.2739,  0.3521],
        [-0.1846,  0.3234],
        [ 0.2928, -0.1070],
        [-0.2769,  0.4576],
        [-0.0263,  0.1810]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.4802,  0.6009],
        [-0.2338,  0.2984],
        [-0.2273,  0.4032],
        [-0.3247,  0.4846],
        [ 0.1046,  0.0839],
        [ 0.2343, -0.1419],
        [-0.0556,  0.2416],
        [-0.0794,  0.2994],
        [-0.2554,  0.3994],
        [ 0.0304,  0.2154],
        [-0.2832,  0.4341],
        [-0.0364,  0.2118]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0126,  0.3326],
        [-0.0220,  0.1966],
        [-0.3616,  0.4339],
        [-0.2345,  0.4186],
        [ 0.0666,  0.1938],
        [-0.3736,  0.5474],
        [-0.3987,  0.4699],
        [-0.0746,  0.2500],
        [-0.1954,  0.4223],
        [-0.0739,  0.0408],
        [-0.1172,  0.3285],
        [ 0.1112,  0.1352]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0830, -0.0046],
        [-0.0276,  0.3614],
        [-0.0167,  0.2537],
        [-0.0303,  0.1455],
        [-0.0714,  0.3232],
        [-0.1010,  0.2706],
        [-0.2582,  0.4249],
        [-0.1678,  0.4506],
        [-0.1792,  0.4155],
        [-0.0911,  0.3022],
        [-0.1422,  0.3375],
        [-0.2080,  0.2255]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1750,  0.3836],
        [-0.1663,  0.3542],
        [-0.3329,  0.4708],
        [-0.1212,  0.3164],
        [ 0.1819, -0.0805],
        [ 0.1052,  0.1447],
        [-0.3843,  0.4943],
        [-0.2846,  0.5517],
        [-0.1059,  0.3642],
        [ 0.0569,  0.2799],
        [-0.2991,  0.6145],
        [-0.0893,  0.2718]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0918,  0.3234],
        [ 0.0498,  0.2615],
        [ 0.0291,  0.1734],
        [-0.1627,  0.3723],
        [ 0.0591,  0.2109],
        [ 0.0035,  0.2002],
        [-0.1474,  0.3468],
        [-0.0353,  0.1712],
        [ 0.1072,  0.0886],
        [-0.2360,  0.3789],
        [-0.1123,  0.2021],
        [ 0.0732,  0.2087]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0742,  0.1170],
        [ 0.1515,  0.0689],
        [-0.1464,  0.3305],
        [-0.2533,  0.3062],
        [ 0.0118,  0.3170],
        [ 0.0142,  0.1927],
        [-0.1013,  0.2990],
        [-0.0336,  0.2441],
        [-0.0292,  0.3513],
        [-0.0383,  0.2023],
        [-0.2175,  0.3317],
        [-0.3377,  0.5116]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-7.9588e-02,  3.1798e-01],
        [-2.2201e-01,  3.5652e-01],
        [ 9.9182e-02,  2.4317e-01],
        [ 1.6228e-04,  3.3273e-01],
        [ 2.9884e-02,  2.1568e-01],
        [ 8.7904e-02,  1.3494e-01],
        [-1.5524e-01,  4.5610e-01],
        [-1.6073e-01,  2.0304e-01],
        [-1.6238e-01,  3.3472e-01],
        [ 1.6414e-01,  2.4692e-02],
        [-1.5243e-01,  2.5700e-01],
        [-3.3734e-01,  4.7315e-01]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.1689,  0.2581],
        [ 0.1059,  0.1846],
        [-0.0783,  0.4237],
        [-0.0447,  0.2534],
        [-0.2568,  0.3364],
        [-0.0080,  0.2349],
        [-0.1579,  0.3250],
        [-0.1823,  0.3051],
        [ 0.0033,  0.3474],
        [-0.1222,  0.3559],
        [-0.2786,  0.4460],
        [ 0.0944,  0.2337]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0868,  0.2916],
        [ 0.0207,  0.1230],
        [ 0.0422,  0.2141],
        [ 0.1136,  0.1356],
        [-0.1347,  0.2351],
        [ 0.1115,  0.0962],
        [-0.2632,  0.4354],
        [-0.1608,  0.2725],
        [-0.2417,  0.2151],
        [ 0.0189,  0.0560],
        [ 0.0627,  0.1456],
        [ 0.2062,  0.1758]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.1246,  0.2159],
        [-0.1540,  0.3180],
        [-0.2668,  0.3378],
        [-0.0100,  0.1980],
        [ 0.1197, -0.0919],
        [-0.1392,  0.2867],
        [ 0.0031,  0.2902],
        [ 0.0660,  0.1092],
        [-0.0084,  0.2072],
        [ 0.0011,  0.2586],
        [-0.0308,  0.3710],
        [-0.3017,  0.6511]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2893,  0.4658],
        [-0.2027,  0.3620],
        [-0.1467,  0.2994],
        [-0.2327,  0.4100],
        [ 0.1249,  0.1164],
        [ 0.0950,  0.1467],
        [-0.0275,  0.0642],
        [-0.1681,  0.2699],
        [-0.0479,  0.2544],
        [ 0.2505, -0.0024],
        [-0.3155,  0.3415],
        [-0.0166,  0.2093]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.4046,  0.4639],
        [-0.1249,  0.3516],
        [ 0.1600,  0.0694],
        [-0.2727,  0.5148],
        [ 0.0641,  0.2103],
        [ 0.3297, -0.1412],
        [ 0.0309,  0.3128],
        [-0.2116,  0.2195],
        [ 0.0983,  0.2085],
        [-0.0288,  0.2252],
        [-0.3098,  0.5251],
        [-0.0149,  0.1103]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0150,  0.3219],
        [-0.2097,  0.3172],
        [-0.2158,  0.4335],
        [-0.2430,  0.4095],
        [-0.1033,  0.2729],
        [-0.4386,  0.5856],
        [-0.3665,  0.3945],
        [-0.0755,  0.3470],
        [-0.2973,  0.4837],
        [ 0.0386,  0.2844],
        [-0.1081,  0.3046],
        [ 0.0241,  0.2036]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.3077,  0.3128],
        [-0.1719,  0.5129],
        [-0.0074,  0.2313],
        [-0.0957,  0.2267],
        [-0.2155,  0.4011],
        [-0.1376,  0.3308],
        [-0.3091,  0.5221],
        [-0.3709,  0.5419],
        [-0.1841,  0.4317],
        [-0.2207,  0.3046],
        [-0.1763,  0.2930],
        [-0.1859,  0.4032]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.2139,  0.3548],
        [-0.3592,  0.4126],
        [-0.2290,  0.4894],
        [ 0.1480,  0.0698],
        [-0.1755,  0.3611],
        [-0.0386,  0.4493],
        [-0.4685,  0.6556],
        [-0.2191,  0.4634],
        [-0.0757,  0.2505],
        [-0.0047,  0.2960],
        [-0.3480,  0.3999],
        [-0.1329,  0.2416]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.0506,  0.2718],
        [-0.2054,  0.2532],
        [-0.2830,  0.4705],
        [ 0.0024,  0.1975],
        [-0.1241,  0.3259],
        [ 0.0485,  0.0500],
        [-0.3443,  0.4826],
        [ 0.1770,  0.2440],
        [ 0.2107,  0.0615],
        [-0.1774,  0.3748],
        [-0.0936,  0.2940],
        [ 0.0824,  0.2243]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0877,  0.0202],
        [-0.0988,  0.2511],
        [-0.1542,  0.2787],
        [-0.1430,  0.3284],
        [-0.1142,  0.3349],
        [ 0.1428,  0.0584],
        [-0.1963,  0.4108],
        [-0.2722,  0.3560],
        [-0.0751,  0.2634],
        [ 0.1420,  0.0639],
        [-0.2823,  0.3956],
        [-0.2237,  0.3378]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.0421,  0.0606],
        [-0.0672,  0.3241],
        [ 0.1090,  0.1026],
        [-0.1260,  0.3277],
        [-0.2586,  0.4832],
        [ 0.0471,  0.1945],
        [-0.2645,  0.5532],
        [-0.0363,  0.1894],
        [-0.1501,  0.2382],
        [-0.0068,  0.1429],
        [-0.2674,  0.3946],
        [-0.2512,  0.5400]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0062,  0.1051],
        [-0.0987,  0.2644],
        [-0.0900,  0.4637],
        [-0.3162,  0.2896],
        [-0.4049,  0.4746],
        [-0.0520,  0.2268],
        [-0.2688,  0.4815],
        [-0.2676,  0.4116],
        [-0.3066,  0.5419],
        [-0.1197,  0.3130],
        [-0.1947,  0.3260],
        [-0.0142,  0.2544]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.2058,  0.3621],
        [ 0.0377,  0.2159],
        [-0.1599,  0.2558],
        [-0.1862,  0.3126],
        [-0.2279,  0.4576],
        [ 0.0886,  0.1775],
        [-0.1619,  0.3114],
        [-0.3047,  0.5473],
        [-0.3090,  0.4347],
        [ 0.0147,  0.1728],
        [-0.1181,  0.2175],
        [-0.1477,  0.3619]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.3630,  0.4876],
        [-0.1832,  0.3526],
        [-0.2792,  0.4520],
        [-0.1102,  0.3192],
        [ 0.1713,  0.1239],
        [-0.0379,  0.3018],
        [-0.1614,  0.3384],
        [-0.1400,  0.3122],
        [-0.4124,  0.5704],
        [-0.2136,  0.3682],
        [-0.1885,  0.3039],
        [-0.0671,  0.3530]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.3499,  0.3549],
        [-0.3032,  0.3871],
        [-0.2469,  0.3254],
        [-0.1219,  0.1957],
        [-0.1827,  0.2593],
        [ 0.1505, -0.0790],
        [ 0.0379,  0.0947],
        [-0.1693,  0.2773],
        [-0.0015,  0.2599],
        [-0.0770,  0.2993],
        [-0.3871,  0.5332],
        [ 0.1270,  0.1533]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.2237,  0.4131],
        [-0.2163,  0.2337],
        [ 0.0668,  0.1229],
        [-0.1480,  0.2871],
        [-0.0417,  0.2160],
        [ 0.2128, -0.0778],
        [-0.0392,  0.3543],
        [-0.0513,  0.1234],
        [ 0.1213,  0.0301],
        [-0.1067,  0.2332],
        [-0.1263,  0.4505],
        [-0.1031,  0.3132]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.1122,  0.2094],
        [-0.0253,  0.0846],
        [-0.2046,  0.3481],
        [-0.0177,  0.2115],
        [-0.1466,  0.3210],
        [-0.3022,  0.4008],
        [-0.3701,  0.4652],
        [-0.2153,  0.4784],
        [-0.2390,  0.5243],
        [ 0.0323, -0.0348],
        [-0.2373,  0.3213],
        [-0.0538,  0.1299]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.0423,  0.0884],
        [-0.2563,  0.4156],
        [ 0.0571,  0.1564],
        [-0.2271,  0.3243],
        [-0.1292,  0.2849],
        [-0.1814,  0.3651],
        [-0.3410,  0.4619],
        [-0.0990,  0.3529],
        [-0.0517,  0.2643],
        [-0.0444,  0.1790],
        [-0.1222,  0.3155],
        [-0.1279,  0.4639]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0849,  0.2542],
        [-0.4008,  0.5259],
        [-0.1513,  0.3492],
        [-0.1552,  0.2204],
        [-0.0734,  0.3081],
        [-0.0624,  0.2013],
        [-0.4236,  0.4623],
        [-0.2327,  0.4541],
        [-0.1919,  0.3760],
        [-0.0635,  0.2235],
        [-0.3977,  0.5142],
        [-0.0848,  0.3103]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.1454,  0.2952],
        [-0.0779,  0.3142],
        [-0.1917,  0.3550],
        [-0.0536,  0.2869],
        [-0.0999,  0.1573],
        [-0.1270,  0.3269],
        [-0.1685,  0.1893],
        [ 0.1601,  0.1605],
        [ 0.0476,  0.1826],
        [-0.0783,  0.2458],
        [-0.1217,  0.3572],
        [ 0.0139,  0.2375]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.1162,  0.2684],
        [-0.2917,  0.3529],
        [-0.1258,  0.3279],
        [-0.1475,  0.1602],
        [ 0.1087,  0.0716],
        [ 0.0752,  0.0489],
        [-0.0121,  0.1722],
        [-0.3894,  0.4003],
        [-0.1657,  0.4278],
        [-0.1353,  0.3167],
        [-0.1039,  0.2863],
        [-0.1206,  0.3004]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.2237,  0.3705],
        [-0.1304,  0.3227],
        [-0.0245,  0.2841],
        [-0.3025,  0.4483],
        [ 0.0020,  0.0262],
        [-0.0038,  0.2113],
        [-0.1619,  0.2562],
        [ 0.0156,  0.0809],
        [-0.0394,  0.2534],
        [-0.1006,  0.3163],
        [-0.1894,  0.4154],
        [-0.1831,  0.4979]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.0752,  0.0502],
        [-0.0260,  0.3066],
        [-0.2018,  0.4684],
        [-0.1902,  0.3799],
        [-0.2894,  0.4318],
        [-0.2515,  0.3578],
        [-0.2611,  0.3552],
        [-0.2393,  0.3274],
        [-0.3394,  0.5299],
        [-0.3645,  0.5956],
        [-0.3359,  0.4836],
        [-0.3162,  0.5259]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0910,  0.2882],
        [-0.1237,  0.2575],
        [-0.0740,  0.0738],
        [-0.1670,  0.1881],
        [-0.3657,  0.5248],
        [ 0.0037,  0.2841],
        [-0.3751,  0.5005],
        [-0.5697,  0.6653],
        [-0.4952,  0.6327],
        [-0.0170,  0.1564],
        [-0.2078,  0.3520],
        [-0.2345,  0.3637]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.3119,  0.4492],
        [ 0.0041,  0.1453],
        [-0.4723,  0.6212],
        [ 0.0917,  0.1273],
        [ 0.1071,  0.2270],
        [-0.1014,  0.2429],
        [-0.2283,  0.3998],
        [-0.1965,  0.2306],
        [-0.0230,  0.1718],
        [-0.2137,  0.3213],
        [-0.1615,  0.3199],
        [-0.1881,  0.5542]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2388,  0.3533],
        [ 0.0142,  0.2612],
        [-0.4007,  0.4436],
        [-0.1380,  0.2048],
        [-0.1777,  0.2213],
        [ 0.0109,  0.1005],
        [-0.1809,  0.3974],
        [-0.2445,  0.3444],
        [ 0.0098,  0.1531],
        [ 0.2414,  0.0195],
        [-0.3403,  0.5453],
        [-0.2163,  0.3612]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.3267,  0.4616],
        [-0.1942,  0.3542],
        [-0.1293,  0.3161],
        [-0.2897,  0.4588],
        [-0.1523,  0.2253],
        [ 0.3671, -0.1177],
        [-0.1252,  0.4610],
        [-0.1351,  0.3720],
        [-0.0039,  0.2250],
        [-0.0162,  0.1671],
        [-0.3838,  0.5332],
        [-0.0865,  0.2562]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.2235,  0.4585],
        [-0.0498,  0.1825],
        [-0.1797,  0.2479],
        [-0.2586,  0.4383],
        [-0.0263,  0.2851],
        [-0.3679,  0.5779],
        [-0.4133,  0.5636],
        [-0.4249,  0.5299],
        [-0.3725,  0.5737],
        [-0.1918,  0.4493],
        [-0.4187,  0.4090],
        [-0.1499,  0.2613]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.2505,  0.4042],
        [-0.3020,  0.6168],
        [ 0.0269,  0.2074],
        [-0.2832,  0.4294],
        [-0.0415,  0.3334],
        [-0.3098,  0.4969],
        [-0.3293,  0.5435],
        [-0.3491,  0.5300],
        [-0.3072,  0.4966],
        [ 0.1954, -0.0013],
        [-0.3231,  0.4748],
        [ 0.1322,  0.1280]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.2117,  0.4125],
        [-0.2060,  0.4461],
        [-0.1610,  0.4127],
        [-0.1749,  0.3452],
        [-0.2041,  0.3841],
        [-0.1971,  0.3987],
        [-0.4174,  0.4670],
        [-0.1234,  0.4183],
        [-0.2409,  0.4300],
        [-0.3783,  0.4998],
        [-0.2377,  0.3499],
        [-0.3094,  0.3806]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.1422,  0.3268],
        [-0.1905,  0.3519],
        [ 0.0656,  0.1982],
        [-0.2863,  0.4270],
        [-0.1095,  0.3174],
        [-0.2087,  0.3711],
        [-0.0979,  0.2981],
        [-0.0499,  0.2673],
        [-0.0242,  0.1806],
        [-0.2528,  0.3853],
        [-0.2513,  0.4996],
        [-0.0190,  0.2764]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[ 0.0818, -0.0058],
        [-0.1181,  0.1981],
        [-0.2763,  0.5085],
        [-0.4502,  0.4658],
        [-0.3983,  0.4100],
        [-0.0190,  0.2106],
        [-0.2781,  0.4235],
        [-0.3440,  0.5305],
        [-0.0238,  0.1552],
        [-0.1008,  0.2377],
        [-0.1449,  0.3117],
        [-0.4200,  0.5611]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.1087,  0.2573],
        [-0.4202,  0.4872],
        [ 0.1969, -0.0634],
        [-0.2151,  0.3199],
        [ 0.0153,  0.2600],
        [-0.1012,  0.4030],
        [-0.1103,  0.4003],
        [-0.0242,  0.1193],
        [-0.0631,  0.2450],
        [-0.1572,  0.2115],
        [-0.1302,  0.3153],
        [-0.2970,  0.6183]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0469,  0.0333],
        [-0.1190,  0.2513],
        [-0.3624,  0.5031],
        [-0.4196,  0.5781],
        [-0.2902,  0.4668],
        [-0.0761,  0.1827],
        [-0.3348,  0.5211],
        [-0.2743,  0.5753],
        [-0.2158,  0.5294],
        [-0.2767,  0.4711],
        [-0.3356,  0.4160],
        [-0.0080,  0.2384]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.3404,  0.5231],
        [-0.0241,  0.1682],
        [ 0.0724,  0.2032],
        [-0.1060,  0.3330],
        [-0.4343,  0.5749],
        [-0.1542,  0.2311],
        [-0.1510,  0.2917],
        [-0.3608,  0.4113],
        [-0.3984,  0.5450],
        [ 0.0435,  0.2527],
        [-0.1436,  0.3084],
        [-0.3024,  0.3914]], device='cuda:0', grad_fn=<AddmmBackward>)
