Iter #50: tensor([[-0.2266, -0.6002],
        [-0.2264, -0.4030],
        [-0.2126, -0.6896],
        [-0.0411, -0.5784],
        [-0.0291, -0.6444],
        [-0.3560, -0.6786],
        [-0.3889, -0.5312],
        [-0.2597, -0.5754],
        [-0.1757, -0.6275],
        [-0.2746, -0.5026],
        [-0.2355, -0.6381],
        [-0.2436, -0.5833]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.3998, -0.2002],
        [-0.2017, -0.4732],
        [-0.2913,  0.0089],
        [-0.1632, -0.1353],
        [-0.2946, -0.2527],
        [-0.0811, -0.4746],
        [-0.2257, -0.3925],
        [-0.4439, -0.0062],
        [ 0.0530, -0.3923],
        [-0.2412, -0.5429],
        [-0.2417, -0.4157],
        [-0.1627, -0.3857]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1770,  0.0262],
        [-0.0943, -0.4214],
        [-0.3768, -0.1128],
        [ 0.2013, -0.5495],
        [-0.0010, -0.6387],
        [-0.5244, -0.1277],
        [-0.1457, -0.2570],
        [-0.0717, -0.4128],
        [-0.4927, -0.0033],
        [-0.1977, -0.2848],
        [-0.2584, -0.2078],
        [-0.2836, -0.1054]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.0751, -0.4566],
        [-0.2623, -0.0426],
        [-0.3876, -0.2022],
        [-0.2637,  0.0197],
        [-0.1563,  0.1721],
        [-0.0676, -0.4472],
        [-0.2986, -0.1369],
        [ 0.0307, -0.4907],
        [-0.0380, -0.1589],
        [-0.3377, -0.2077],
        [-0.0813, -0.5505],
        [-0.2244, -0.1484]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.1955, -0.4743],
        [-0.2535, -0.2367],
        [-0.2770, -0.1358],
        [-0.3392, -0.2583],
        [-0.2073, -0.1273],
        [ 0.0906, -0.4796],
        [-0.4418, -0.0267],
        [-0.3551, -0.3614],
        [-0.3309, -0.1947],
        [-0.3817, -0.2624],
        [-0.2134, -0.2379],
        [-0.0477, -0.2797]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.2924, -0.3740],
        [-0.1996, -0.3646],
        [ 0.0169, -0.6213],
        [-0.2516, -0.3029],
        [-0.2697, -0.0839],
        [-0.1535, -0.0899],
        [ 0.0596, -0.3022],
        [ 0.0769, -0.4387],
        [-0.6615,  0.2777],
        [-0.2989, -0.2185],
        [-0.1653, -0.1593],
        [-0.1804, -0.3834]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.3033, -0.1301],
        [ 0.1085, -0.6786],
        [-0.1010, -0.3709],
        [-0.4455, -0.0764],
        [ 0.2254, -0.2715],
        [-0.4068, -0.0986],
        [-0.0906, -0.5129],
        [-0.3592, -0.1125],
        [-0.2349, -0.0127],
        [-0.0059, -0.0752],
        [-0.2089, -0.1892],
        [-0.1403, -0.3814]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.4547, -0.0995],
        [ 0.0871, -0.5359],
        [-0.1199, -0.3573],
        [-0.4181, -0.0434],
        [-0.3545,  0.0627],
        [-0.3973, -0.0706],
        [-0.1129, -0.2460],
        [-0.1782, -0.2713],
        [-0.1496, -0.1162],
        [-0.3375, -0.0107],
        [-0.0059, -0.4063],
        [-0.1312, -0.1145]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.4995,  0.0135],
        [-0.2546, -0.0936],
        [ 0.0881, -0.4376],
        [-0.1911, -0.1630],
        [ 0.1175, -0.5228],
        [-0.1970, -0.2512],
        [-0.3111, -0.2431],
        [ 0.0924, -0.5899],
        [-0.2452, -0.0064],
        [-0.2508, -0.2200],
        [ 0.1629, -0.3525],
        [-0.1154, -0.3986]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.3324, -0.0010],
        [ 0.0440, -0.4198],
        [-0.1962, -0.2835],
        [-0.4905,  0.0287],
        [-0.4866,  0.1695],
        [-0.4154, -0.0765],
        [-0.3618, -0.1319],
        [-0.2654, -0.1405],
        [-0.0261, -0.4215],
        [-0.3682, -0.2320],
        [-0.2209, -0.1721],
        [-0.3842, -0.1954]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.0426, -0.1983],
        [ 0.1671, -0.2859],
        [-0.0722, -0.4142],
        [-0.3680,  0.0370],
        [-0.0585, -0.1187],
        [-0.3804,  0.0513],
        [-0.7011,  0.1597],
        [-0.0205, -0.3668],
        [ 0.0892, -0.4701],
        [-0.5352, -0.2206],
        [-0.1038, -0.2468],
        [-0.1649, -0.2245]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.3859,  0.0523],
        [-0.5130, -0.2011],
        [-0.4007, -0.0926],
        [-0.2153, -0.1187],
        [-0.2343, -0.1240],
        [-0.0661, -0.3378],
        [-0.2042, -0.0316],
        [-0.0533, -0.6413],
        [ 0.1454, -0.5292],
        [ 0.1595, -0.5663],
        [-0.2963, -0.0598],
        [ 0.1918, -0.6698]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.3527,  0.0770],
        [-0.1075, -0.4517],
        [-0.5550, -0.0558],
        [-0.3552, -0.1995],
        [-0.1250, -0.0920],
        [ 0.0195, -0.4678],
        [-0.0071, -0.3955],
        [-0.5804,  0.0710],
        [-0.3029, -0.1344],
        [-0.3211, -0.2024],
        [ 0.0487, -0.6668],
        [ 0.1253, -0.4022]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.3468, -0.0337],
        [-0.1552, -0.2095],
        [-0.3693,  0.2400],
        [ 0.0620, -0.4923],
        [ 0.2677, -0.6712],
        [-0.7675,  0.0882],
        [ 0.1730, -0.3895],
        [-0.0335, -0.3548],
        [-0.6073,  0.2847],
        [-0.1298, -0.5201],
        [-0.2658, -0.2497],
        [-0.2062, -0.3192]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1110, -0.3956],
        [ 0.2238, -0.5596],
        [-0.5033,  0.1150],
        [-0.1359, -0.1009],
        [-0.2843, -0.2036],
        [ 0.0514, -0.4150],
        [-0.1173, -0.4539],
        [-0.1659, -0.4582],
        [-0.4072,  0.0929],
        [-0.4296,  0.0380],
        [ 0.0890, -0.6041],
        [-0.3137, -0.1188]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.2474, -0.6419],
        [-0.2576, -0.1503],
        [-0.0457, -0.3684],
        [-0.0340, -0.2969],
        [-0.1248, -0.2381],
        [-0.0388, -0.4010],
        [-0.2204, -0.2293],
        [-0.6025,  0.1050],
        [-0.1045, -0.3814],
        [ 0.0763, -0.4967],
        [-0.1287, -0.3179],
        [-0.2312, -0.2799]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.3568, -0.1494],
        [-0.1825, -0.3070],
        [-0.3733, -0.1260],
        [ 0.1377, -0.6277],
        [-0.3872, -0.2348],
        [-0.2026, -0.2073],
        [-0.0325, -0.2472],
        [-0.1373, -0.3648],
        [-0.7738,  0.1734],
        [-0.4200, -0.1598],
        [-0.4072, -0.1483],
        [-0.0505, -0.1701]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.8787,  0.1494],
        [ 0.1738, -0.6099],
        [-0.4148, -0.0277],
        [-0.2873, -0.0200],
        [ 0.2389, -0.8248],
        [-0.4618, -0.0033],
        [-0.1649, -0.4321],
        [-0.4721, -0.0476],
        [-0.5488,  0.0398],
        [-0.1613, -0.2267],
        [-0.2748,  0.0922],
        [-0.2366, -0.2372]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.1885, -0.3898],
        [-0.0060, -0.1196],
        [-0.1037, -0.5647],
        [-0.5110, -0.1639],
        [-0.2887, -0.1937],
        [-0.0272, -0.3361],
        [-0.4983,  0.0658],
        [-0.4804, -0.0471],
        [-0.4398,  0.0269],
        [-0.5161,  0.3151],
        [ 0.0028, -0.4961],
        [-0.0293, -0.4030]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.1701, -0.1337],
        [-0.3574,  0.1825],
        [-0.3216, -0.0751],
        [-0.3002, -0.2181],
        [-0.0142, -0.5928],
        [-0.0277, -0.2071],
        [-0.4846,  0.2413],
        [-0.3935,  0.1185],
        [-0.0713, -0.2437],
        [ 0.0999, -0.7106],
        [ 0.2178, -0.4154],
        [ 0.0118, -0.5942]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.2197, -0.3492],
        [-0.3233, -0.1031],
        [-0.2020, -0.3208],
        [-0.5481,  0.0591],
        [ 0.0028, -0.0889],
        [-0.3771,  0.0869],
        [-0.1365, -0.1412],
        [-0.4247,  0.0440],
        [-0.1163, -0.1082],
        [-0.0146, -0.3055],
        [ 0.0176, -0.3796],
        [-0.2902, -0.0489]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[ 0.1787, -0.3390],
        [ 0.2052, -0.7661],
        [-0.2251, -0.1895],
        [-0.2926,  0.1156],
        [-0.2113, -0.1659],
        [-0.3045,  0.0522],
        [-0.5277,  0.2659],
        [-0.0345, -0.4355],
        [ 0.1212, -0.3910],
        [-0.3712, -0.3327],
        [-0.0185, -0.3270],
        [ 0.0250, -0.3828]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[ 0.0146, -0.2926],
        [-0.4797, -0.2712],
        [ 0.0071, -0.2780],
        [-0.2157, -0.2553],
        [-0.4350, -0.2169],
        [ 0.2351, -0.6128],
        [-0.4171,  0.0342],
        [-0.1961, -0.1426],
        [-0.1088, -0.2561],
        [ 0.2870, -0.6054],
        [-0.5415,  0.1202],
        [-0.2889, -0.3261]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0144, -0.3110],
        [ 0.0061, -0.3800],
        [-0.4184,  0.0266],
        [-0.2972, -0.0608],
        [-0.4116,  0.0633],
        [-0.1390,  0.0514],
        [-0.0670, -0.4789],
        [-0.5215,  0.1170],
        [-0.1378, -0.3040],
        [-0.1011, -0.3660],
        [-0.5351,  0.0874],
        [-0.2208, -0.0735]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.1546,  0.0994],
        [-0.1382, -0.4328],
        [-0.5070,  0.2238],
        [ 0.2863, -0.5934],
        [ 0.0639, -0.4249],
        [-0.4635, -0.1759],
        [ 0.1199, -0.5213],
        [ 0.0590, -0.6347],
        [-0.8404,  0.5207],
        [ 0.1405, -0.6807],
        [-0.1408, -0.2999],
        [-0.0337, -0.3373]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0587, -0.4509],
        [-0.1849, -0.1923],
        [-0.2637,  0.0528],
        [-0.5469,  0.2082],
        [-0.3556, -0.3987],
        [-0.2198, -0.3337],
        [-0.2713,  0.1769],
        [-0.1779, -0.2515],
        [-0.5319,  0.0219],
        [-0.1626, -0.0573],
        [-0.0272, -0.4560],
        [-0.3422, -0.1217]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[ 0.1925, -0.3885],
        [ 0.0508, -0.3667],
        [ 0.0453, -0.3239],
        [-0.3383, -0.0091],
        [-0.2011,  0.0259],
        [-0.0081, -0.5006],
        [-0.2229, -0.1340],
        [-0.4790, -0.1151],
        [-0.0367, -0.3312],
        [-0.1680, -0.1600],
        [-0.1982,  0.0464],
        [ 0.3309, -0.5192]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.1979, -0.4995],
        [-0.2588, -0.1572],
        [-0.3920, -0.2437],
        [-0.2631, -0.1903],
        [ 0.0730, -0.3018],
        [-0.2167, -0.3576],
        [-0.0095, -0.4544],
        [ 0.2449, -0.3614],
        [-0.7184,  0.5114],
        [-0.3704, -0.0833],
        [-0.5045,  0.0777],
        [-0.2505, -0.2570]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.7504,  0.2687],
        [-0.0113, -0.4353],
        [ 0.2007, -0.3713],
        [-0.4241,  0.2337],
        [-0.1504, -0.1824],
        [-0.4282,  0.0528],
        [-0.1185, -0.1609],
        [-0.2880, -0.0887],
        [-0.1896, -0.1039],
        [-0.2530, -0.0923],
        [-0.3950, -0.3094],
        [-0.1830, -0.2311]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.1607, -0.3006],
        [ 0.2878, -0.5921],
        [ 0.3608, -0.6575],
        [-0.3076, -0.0612],
        [-0.2917, -0.0469],
        [-0.4370,  0.0816],
        [-0.3441,  0.0494],
        [-0.3122, -0.2379],
        [-0.1663, -0.2414],
        [-0.2799, -0.2049],
        [ 0.1707, -0.2851],
        [-0.1456, -0.1760]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.1974, -0.3092],
        [-0.4293, -0.0964],
        [-0.3588, -0.1816],
        [-0.1709, -0.3518],
        [-0.1805, -0.5203],
        [-0.0420, -0.3032],
        [-0.2930,  0.1452],
        [ 0.0691, -0.3801],
        [-0.2484, -0.1292],
        [ 0.0842, -0.5918],
        [ 0.2479, -0.6050],
        [-0.3070, -0.0719]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.3454,  0.0604],
        [ 0.0397, -0.3920],
        [-0.3565,  0.0682],
        [-0.3909,  0.0623],
        [-0.4250,  0.0936],
        [-0.3508,  0.1327],
        [ 0.1160, -0.3598],
        [-0.3763, -0.1472],
        [-0.2273,  0.0143],
        [-0.2960, -0.0439],
        [-0.0414, -0.2231],
        [-0.1293, -0.3387]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1770, -0.3657],
        [ 0.2382, -0.6671],
        [-0.2793, -0.2337],
        [-0.1983, -0.0096],
        [-0.3409, -0.1064],
        [-0.1132, -0.2834],
        [-0.5440,  0.2329],
        [-0.0793, -0.4338],
        [-0.2038, -0.2112],
        [-0.5348,  0.0643],
        [ 0.0648, -0.2640],
        [-0.4157,  0.0205]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #50: tensor([[-0.2865, -0.1941],
        [-0.2077, -0.3808],
        [ 0.0170, -0.4994],
        [-0.1333, -0.2662],
        [-0.2654,  0.1113],
        [-0.0035, -0.1447],
        [-0.2203, -0.2917],
        [ 0.0446, -0.4228],
        [-0.2667, -0.0151],
        [ 0.0335, -0.5539],
        [-0.1321, -0.2200],
        [ 0.1247, -0.3897]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.4542, -0.1278],
        [ 0.1881, -0.5496],
        [-0.5090,  0.1863],
        [-0.0559, -0.2272],
        [ 0.0395, -0.3181],
        [-0.1949, -0.2298],
        [-0.2499, -0.1797],
        [-0.3050, -0.1978],
        [-0.0979, -0.1071],
        [-0.1381, -0.3266],
        [-0.3744, -0.0601],
        [ 0.1133, -0.3968]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.4589,  0.0911],
        [-0.2333, -0.3371],
        [-0.4600,  0.2703],
        [ 0.0881, -0.4787],
        [-0.0750, -0.4234],
        [-0.5107,  0.1483],
        [-0.0746, -0.2591],
        [-0.3612, -0.0193],
        [-0.2769,  0.0148],
        [-0.0206, -0.3541],
        [ 0.3012, -0.4306],
        [-0.3058,  0.0770]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.0481, -0.4085],
        [ 0.1533, -0.3080],
        [-0.3920, -0.0137],
        [-0.2908, -0.2246],
        [-0.0893, -0.2253],
        [-0.0762, -0.1302],
        [-0.2301, -0.0881],
        [-0.2248, -0.3049],
        [-0.3023, -0.3422],
        [-0.1120, -0.3328],
        [ 0.3402, -0.4198],
        [-0.6133, -0.0632]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.2319, -0.2255],
        [-0.2771, -0.0743],
        [-0.1559, -0.2543],
        [-0.3402, -0.3566],
        [-0.0945, -0.2989],
        [ 0.1487, -0.3957],
        [-0.0364, -0.1354],
        [-0.1667, -0.3659],
        [-0.1735, -0.0781],
        [-0.0863, -0.0163],
        [-0.2142, -0.1570],
        [ 0.0676, -0.3669]], device='cuda:0', grad_fn=<AddmmBackward>)
