Iter #50: tensor([[-0.9952, -0.0081, -0.0179],
        [-1.0823, -0.1509,  0.0622],
        [-0.9673,  0.1022, -0.1257],
        [-1.0432,  0.0105,  0.0517],
        [-0.9297,  0.0874, -0.0288],
        [-1.0672,  0.0121, -0.3099],
        [-0.8410,  0.2061, -0.0532],
        [-0.8301,  0.1763, -0.1051],
        [-0.9026,  0.2773, -0.2682],
        [-0.9868,  0.2689, -0.1305],
        [-1.0675,  0.0749,  0.0882],
        [-0.7830,  0.2718, -0.1754]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-1.1118,  0.3347,  0.0832],
        [-1.2591,  0.0955, -0.0224],
        [-1.1692,  0.2347,  0.0792],
        [-1.0616,  0.1695,  0.0842],
        [-0.9391,  0.2526, -0.0698],
        [-1.2660,  0.2854, -0.1909],
        [-1.2191,  0.1841,  0.0763],
        [-1.0422,  0.2574,  0.0715],
        [-1.1144,  0.3266,  0.0748],
        [-1.1443,  0.0330, -0.0361],
        [-1.1190,  0.2860,  0.0101],
        [-1.2211,  0.2925, -0.1946]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.9335, -0.2290,  0.3346],
        [-1.1271, -0.0026,  0.3576],
        [-0.9121, -0.2514,  0.4435],
        [-1.0594, -0.0025,  0.2420],
        [-0.7577, -0.0158,  0.1784],
        [-0.8757, -0.1009,  0.5360],
        [-1.0284,  0.0426,  0.3323],
        [-0.8821, -0.4307,  0.0883],
        [-0.9574, -0.1690,  0.3772],
        [-1.1083, -0.1700,  0.3845],
        [-0.9668,  0.0679,  0.0549],
        [-1.1235, -0.0686,  0.3296]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-1.0502,  0.1712, -0.1498],
        [-1.0188,  0.0819, -0.1030],
        [-1.0805,  0.1994, -0.1098],
        [-1.0446,  0.0510, -0.0171],
        [-1.0878,  0.3440, -0.0631],
        [-0.9205,  0.2563, -0.0459],
        [-0.9043,  0.0611, -0.0107],
        [-0.9009,  0.1349,  0.0383],
        [-1.1424, -0.0432,  0.0553],
        [-0.8951,  0.0276, -0.0332],
        [-0.9286,  0.0130,  0.2626],
        [-0.9981,  0.3402, -0.2681]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-7.3761e-01,  4.7157e-01, -3.3311e-01],
        [-1.0734e+00,  2.4445e-01, -5.5301e-02],
        [-9.9574e-01,  9.6018e-02,  6.8543e-02],
        [-1.0084e+00,  2.0452e-01, -4.6608e-02],
        [-1.0318e+00,  1.1276e-01,  4.7996e-02],
        [-7.9972e-01,  1.0676e-01, -1.1680e-01],
        [-7.5191e-01, -9.2551e-02,  3.3824e-01],
        [-9.5047e-01,  1.3688e-01,  7.1176e-02],
        [-9.9294e-01, -1.6055e-01,  1.4222e-01],
        [-1.0852e+00,  1.2374e-01,  6.1444e-02],
        [-7.3187e-01, -1.4731e-02, -9.5858e-02],
        [-7.4126e-01,  2.1228e-04,  1.9364e-01]], device='cuda:0',
       grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.9038, -0.1929,  0.5467],
        [-1.0501,  0.0404,  0.1638],
        [-0.8228,  0.3117, -0.3240],
        [-0.8222,  0.1276, -0.0649],
        [-0.9402,  0.0507,  0.0525],
        [-0.8927,  0.2139, -0.1009],
        [-1.0245,  0.3807, -0.1662],
        [-0.9655,  0.3557, -0.2612],
        [-0.7679,  0.1714, -0.0684],
        [-0.8828,  0.2009, -0.0110],
        [-1.1173,  0.2624, -0.4072],
        [-0.9296,  0.1206, -0.1403]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.8802,  0.2767, -0.4085],
        [-0.9610,  0.0818, -0.1074],
        [-0.9202, -0.0728,  0.1390],
        [-0.9472, -0.0793,  0.0951],
        [-0.7699, -0.0133,  0.1168],
        [-0.9890, -0.0257,  0.2680],
        [-0.8292, -0.1693,  0.2455],
        [-0.6790, -0.1534,  0.3234],
        [-0.8124,  0.4429, -0.4444],
        [-0.7394, -0.0595,  0.1261],
        [-0.8973,  0.2587, -0.0640],
        [-0.8484,  0.0400,  0.0966]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.6985,  0.4658, -0.4339],
        [-0.9619, -0.0056, -0.0769],
        [-0.8793, -0.0497, -0.1629],
        [-0.5464,  0.0989, -0.4138],
        [-0.6860,  0.1946, -0.0131],
        [-0.8616,  0.1074, -0.1554],
        [-0.7955,  0.2544, -0.4314],
        [-0.7403,  0.1244, -0.2826],
        [-0.9617,  0.1331, -0.0504],
        [-0.7246,  0.2155, -0.1703],
        [-0.8633,  0.1094, -0.0416],
        [-0.8813,  0.1044, -0.1357]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.7150, -0.1837,  0.1748],
        [-0.8838,  0.0632, -0.0038],
        [-0.8235,  0.5230, -0.2558],
        [-0.8175, -0.0874,  0.1946],
        [-0.8275,  0.2668, -0.5328],
        [-0.6359,  0.1788, -0.2085],
        [-0.6570,  0.0542, -0.3546],
        [-0.8219,  0.1228, -0.2148],
        [-0.8694, -0.0529,  0.2884],
        [-0.6036, -0.1001,  0.0237],
        [-0.8429, -0.0674,  0.0924],
        [-0.7564,  0.1497, -0.0660]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.9019, -0.3720,  0.5097],
        [-0.7431, -0.6274,  0.5493],
        [-0.7710, -0.3107,  0.4977],
        [-0.8366, -0.3039,  0.2843],
        [-0.7200, -0.6225,  0.5444],
        [-0.8301, -0.3302,  0.3215],
        [-0.6437, -0.2491,  0.4704],
        [-0.8207, -0.2610, -0.0940],
        [-0.7155, -0.6036,  0.3733],
        [-0.6575, -0.2046,  0.1649],
        [-0.5120, -0.3998,  0.3857],
        [-0.8201, -0.0427, -0.0763]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.6595, -0.3436,  0.2312],
        [-0.5924, -0.0856,  0.0262],
        [-0.5906,  0.2374, -0.4028],
        [-0.5677, -0.5745,  0.1892],
        [-0.5493,  0.3615, -0.4671],
        [-0.7055, -0.2840,  0.2977],
        [-0.7397,  0.0401, -0.2864],
        [-0.7040, -0.3075,  0.2495],
        [-0.5549, -0.0115,  0.1574],
        [-0.5198, -0.1036,  0.0228],
        [-0.7065, -0.3822,  0.1757],
        [-0.7377,  0.4760, -0.6110]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #600: tensor([[-0.5495, -0.2707,  0.2712],
        [-0.8590, -0.4087,  0.3306],
        [-0.5182, -0.3565,  0.4575],
        [-0.5573, -0.0841,  0.3649],
        [-0.4884, -0.2504,  0.2092],
        [-0.7275,  0.4229, -0.5813],
        [-0.5166, -0.3480, -0.0114],
        [-0.4857,  0.0511, -0.2640],
        [-0.5474,  0.2384, -0.3949],
        [-0.6171, -0.1738, -0.2002],
        [-0.6363,  0.0837, -0.3255],
        [-0.5160, -0.0301, -0.0173]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #650: tensor([[-0.4270, -0.0923, -0.1506],
        [-0.4785,  0.0752, -0.4313],
        [-0.5226, -0.1119, -0.0902],
        [-0.3789,  0.0165, -0.1607],
        [-0.6144, -0.4189,  0.2164],
        [-0.5851, -0.2026,  0.2285],
        [-0.6668, -0.0421, -0.2156],
        [-0.5217, -0.3071,  0.0014],
        [-0.5730,  0.0942,  0.3112],
        [-0.6885, -0.4650,  0.4195],
        [-0.3988,  0.1415, -0.2831],
        [-0.4360, -0.1312, -0.2706]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #700: tensor([[-0.4182,  0.2830, -0.3581],
        [-0.4325, -0.0350, -0.4189],
        [-0.4247,  0.3921, -0.7775],
        [-0.4176, -0.1647, -0.1527],
        [-0.5644,  0.1937, -0.5450],
        [-0.3708, -0.0621, -0.2095],
        [-0.4953, -0.4087,  0.0940],
        [-0.5005, -0.0959, -0.0929],
        [-0.4346, -0.0497, -0.3479],
        [-0.4449, -0.0420, -0.4106],
        [-0.5142, -0.1429, -0.2320],
        [-0.4694, -0.4004,  0.1669]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #750: tensor([[-0.4437,  0.2550, -0.5135],
        [-0.3429,  0.1989, -0.6753],
        [-0.5916,  0.0553, -0.6459],
        [-0.5339,  0.0565, -0.5471],
        [-0.4377,  0.1780, -0.5366],
        [-0.4762, -0.7386,  0.5990],
        [-0.2958, -0.6960,  0.4598],
        [-0.5135, -0.4201,  0.2807],
        [-0.4074,  0.0290, -0.3918],
        [-0.5086, -0.3077,  0.0036],
        [-0.4578, -0.3215,  0.0849],
        [-0.5846,  0.1244, -0.5548]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #800: tensor([[-0.6009,  0.1473, -0.4533],
        [-0.4489, -0.1976, -0.4496],
        [-0.2055, -0.1804, -0.2623],
        [-0.4487, -0.0173, -0.5748],
        [-0.4787, -0.0655, -0.1447],
        [-0.5191, -0.1168, -0.5548],
        [-0.3798, -0.0764, -0.3346],
        [-0.3670, -0.3040,  0.0301],
        [-0.4765, -0.1550, -0.1923],
        [-0.6777, -0.1504, -0.5123],
        [-0.2285, -0.0760, -0.2941],
        [-0.4503,  0.2745, -0.8304]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #850: tensor([[-0.4002, -0.2814, -0.1330],
        [-0.3281, -0.1793, -0.1881],
        [-0.4471,  0.0572, -0.6483],
        [-0.2460,  0.3225, -0.7679],
        [-0.2780, -0.4092,  0.1909],
        [-0.3378, -0.3228, -0.1837],
        [-0.2655, -0.0100, -0.3412],
        [-0.4219, -0.1204, -0.3002],
        [-0.2542, -0.2112, -0.0503],
        [-0.2420, -0.0275, -0.2507],
        [-0.2583, -0.0206, -0.2853],
        [-0.2650, -0.3393,  0.1508]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #900: tensor([[-0.1361, -0.3391, -0.0530],
        [-0.4118, -0.2609, -0.0251],
        [-0.2567, -0.0471,  0.0629],
        [-0.6034, -0.2225, -0.0360],
        [-0.3144, -0.4434,  0.3135],
        [-0.2633, -0.2578,  0.0182],
        [-0.2606, -0.4237,  0.0687],
        [-0.3709, -0.2648, -0.0920],
        [-0.1577, -0.0695, -0.0377],
        [-0.3113, -0.0384, -0.3501],
        [-0.4284, -0.4640, -0.0152],
        [-0.4415, -0.4957,  0.0695]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #950: tensor([[-0.1245, -0.9982,  1.1674],
        [-0.4463, -1.0221,  0.8940],
        [-0.3244, -0.8948,  0.8602],
        [-0.1748, -0.8386,  0.7901],
        [-0.4011, -1.0163,  1.1886],
        [-0.2951, -0.7393,  0.7657],
        [-0.6389, -0.9861,  0.7948],
        [-0.3887, -0.8385,  0.4714],
        [-0.2684, -0.6783,  0.5428],
        [-0.5590, -0.8363,  0.7388],
        [-0.2810, -0.5252,  0.7649],
        [-0.3135, -0.9993,  0.8216]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1000: tensor([[-0.4502, -0.4413,  0.1192],
        [-0.2546, -0.6613,  0.9216],
        [-0.2902, -0.6253,  0.0322],
        [-0.1374, -0.2112, -0.0762],
        [-0.2029, -0.2629, -0.1525],
        [-0.2317, -0.6031,  0.5136],
        [-0.3497, -0.4680, -0.0089],
        [-0.2702, -0.4286,  0.3540],
        [-0.3329, -0.8432,  0.7030],
        [-0.2212, -0.6266,  0.2490],
        [-0.4330, -0.7052,  0.7690],
        [-0.4732, -0.9482,  0.4154]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1050: tensor([[-0.0580, -0.4397, -0.0497],
        [-0.2070, -0.1008, -0.0806],
        [-0.0604, -0.4992,  0.4463],
        [-0.1974, -0.3804,  0.0960],
        [-0.3169, -0.6217,  0.4922],
        [-0.2793, -0.5124,  0.3801],
        [-0.3546, -0.4335,  0.2511],
        [-0.1600, -0.4484,  0.1324],
        [-0.1737, -0.4754,  0.0183],
        [-0.3769, -0.5302,  0.3808],
        [-0.1911, -0.3879, -0.0865],
        [-0.3517, -0.5878,  0.1506]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1100: tensor([[-0.2309, -0.5942, -0.0323],
        [-0.1364, -0.2289, -0.1141],
        [-0.1525, -0.3719, -0.2949],
        [-0.0699, -0.2019, -0.1836],
        [-0.2241, -0.5750,  0.2215],
        [-0.0480, -0.2089, -0.1994],
        [-0.2483, -0.4702, -0.0796],
        [-0.2956, -0.3466, -0.1635],
        [-0.0553, -0.3459,  0.0080],
        [-0.1405, -0.4831,  0.2678],
        [-0.1911, -0.3787,  0.0863],
        [-0.0744, -0.2276, -0.2760]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1150: tensor([[-0.2269, -0.5147,  0.3569],
        [ 0.1089,  0.0327, -0.5154],
        [-0.3108, -0.4175, -0.0705],
        [-0.0489, -0.3458, -0.1130],
        [-0.1308, -0.3970,  0.1962],
        [-0.1035, -0.4957,  0.4834],
        [-0.3472, -0.7034,  0.2934],
        [-0.1421, -0.5470,  0.0032],
        [-0.1111, -0.4000, -0.0630],
        [-0.2629, -0.6150,  0.4099],
        [-0.2660, -0.4266,  0.1097],
        [-0.2582, -0.2776, -0.1933]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1200: tensor([[-0.2259, -0.3501,  0.1429],
        [-0.3157, -0.5356,  0.5188],
        [-0.1344, -0.3606,  0.1806],
        [-0.2854, -0.4979,  0.1083],
        [-0.1987, -0.4503,  0.0937],
        [ 0.0625, -0.2990, -0.1925],
        [-0.2516, -0.5603, -0.0804],
        [-0.1783, -0.2905, -0.1169],
        [-0.3416, -0.6019,  0.4908],
        [-0.3657, -0.6811,  0.2673],
        [-0.1766, -0.2903,  0.1095],
        [-0.0670, -0.2225, -0.2004]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1250: tensor([[-0.1436, -0.5277, -0.0749],
        [-0.2071, -0.5051,  0.2352],
        [-0.0302, -0.4209,  0.0926],
        [ 0.1758, -0.0909, -0.3590],
        [-0.2902, -0.3960, -0.1861],
        [-0.2604, -0.3309,  0.1678],
        [-0.1567, -0.5378,  0.0138],
        [-0.0424, -0.2807,  0.0535],
        [-0.3584, -0.4406,  0.1315],
        [-0.1129, -0.2797, -0.0631],
        [-0.4440, -0.7279,  0.7130],
        [-0.3597, -0.3323,  0.1730]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1300: tensor([[-0.1228, -0.3410, -0.2875],
        [-0.0209, -0.2004, -0.2318],
        [ 0.0058, -0.1148, -0.1669],
        [-0.2333, -0.2316,  0.0178],
        [ 0.0433, -0.0192, -0.6868],
        [-0.1620, -0.4673,  0.2046],
        [-0.1911, -0.4637,  0.1091],
        [-0.3494, -0.5440,  0.2339],
        [-0.0257, -0.3103, -0.0984],
        [-0.1658, -0.3965, -0.0599],
        [-0.1627, -0.4503,  0.0007],
        [-0.2270, -0.6007,  0.4296]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1350: tensor([[-0.2775, -0.4352,  0.4633],
        [-0.4099, -0.7351,  0.6280],
        [-0.2921, -0.2520, -0.1693],
        [-0.1197, -0.2386, -0.0853],
        [ 0.0819, -0.0803, -0.6435],
        [ 0.0178, -0.2891, -0.2249],
        [-0.0949, -0.2588, -0.4083],
        [-0.1225, -0.3576, -0.0388],
        [-0.2067, -0.1747, -0.2747],
        [-0.1769, -0.2460, -0.1886],
        [-0.1030, -0.1878, -0.3135],
        [-0.3307, -0.2587,  0.0238]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1400: tensor([[-0.2147, -0.4381, -0.0032],
        [-0.1365, -0.3763, -0.2355],
        [-0.1976, -0.4544,  0.4855],
        [-0.3242, -0.6104,  0.3797],
        [-0.3141, -0.4827,  0.1442],
        [-0.2461, -0.5541,  0.2310],
        [-0.2731, -0.4109,  0.5665],
        [-0.1855, -0.5347,  0.2657],
        [-0.3317, -0.4217,  0.4080],
        [-0.2636, -0.4132,  0.2332],
        [-0.2641, -0.6447,  0.1466],
        [-0.4654, -0.4233,  0.4523]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1450: tensor([[-8.7167e-02, -3.3578e-01, -1.0998e-02],
        [-1.4075e-01, -3.4046e-01, -8.1558e-02],
        [-5.4615e-01, -6.0586e-01,  3.5373e-01],
        [-1.6938e-01, -2.7378e-01, -5.3434e-02],
        [-4.0617e-02, -1.8044e-01, -2.5433e-01],
        [ 6.8245e-04, -1.6329e-01, -3.2177e-01],
        [-9.1896e-02, -2.2530e-01, -2.7373e-01],
        [ 8.3613e-02, -1.2979e-01, -8.4076e-01],
        [-8.8163e-02, -2.5321e-01, -2.9557e-01],
        [ 2.1936e-02, -2.5426e-01, -6.6492e-01],
        [-5.7751e-02,  3.1116e-02, -8.5997e-01],
        [-1.0100e-01, -2.9195e-01, -4.3939e-02]], device='cuda:0',
       grad_fn=<AddmmBackward>)
Iter #1500: tensor([[-0.1115, -0.1439,  0.0876],
        [-0.1765, -0.2817,  0.1642],
        [-0.3671, -0.3284, -0.0273],
        [ 0.0315, -0.1582, -0.3268],
        [-0.3149, -0.3199, -0.1684],
        [-0.2996, -0.2834, -0.3447],
        [-0.1164, -0.1713, -0.6046],
        [-0.2804, -0.3978,  0.0843],
        [-0.2603, -0.0427, -0.2745],
        [-0.1283, -0.3512, -0.4304],
        [-0.0722, -0.2674, -0.1912],
        [-0.2415, -0.3430, -0.2362]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1550: tensor([[-0.1996, -0.2965, -0.0800],
        [-0.0995, -0.2478, -0.4179],
        [-0.3789, -0.4240,  0.2477],
        [-0.0732, -0.0626, -0.7208],
        [-0.2554, -0.3318, -0.0540],
        [-0.3159, -0.2267, -0.0595],
        [-0.2371, -0.2869, -0.0353],
        [-0.1976, -0.3591,  0.2439],
        [-0.0477, -0.2904,  0.0128],
        [-0.2264, -0.3842,  0.1538],
        [ 0.1567, -0.0257, -0.7963],
        [-0.3408, -0.2498,  0.0414]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1600: tensor([[-0.2811, -0.2606, -0.0362],
        [-0.0933, -0.0923, -0.3828],
        [-0.5725, -0.5286,  0.5976],
        [-0.5340, -0.4534,  0.3402],
        [-0.4776, -0.4531,  0.1094],
        [-0.1348, -0.1152, -0.2452],
        [ 0.1382,  0.0975, -0.6828],
        [ 0.2656,  0.2314, -1.1470],
        [-0.5326, -0.5402,  0.5914],
        [-0.2581, -0.4357,  0.0445],
        [-0.6906, -0.6352,  0.6717],
        [-0.6974, -0.7390,  0.8504]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1650: tensor([[ 0.0276, -0.0640, -0.7080],
        [ 0.1216,  0.0420, -0.8753],
        [-0.0935, -0.0865, -0.5691],
        [-0.0948, -0.1749, -0.2703],
        [-0.1365, -0.3621, -0.0425],
        [-0.2329, -0.1614, -0.1070],
        [ 0.0177,  0.0062, -0.7158],
        [-0.1480, -0.2159, -0.0926],
        [ 0.0319,  0.0274, -0.6871],
        [-0.1039, -0.2489, -0.3442],
        [ 0.1103, -0.1102, -0.5394],
        [-0.3105, -0.3931,  0.0170]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1700: tensor([[-0.2661, -0.0641, -0.1573],
        [-0.3379, -0.4075, -0.1873],
        [-0.2029, -0.2030, -0.3573],
        [-0.2105, -0.3075,  0.1157],
        [-0.1467, -0.0473, -0.3525],
        [-0.3934, -0.4579,  0.3422],
        [-0.4694, -0.3970,  0.2238],
        [-0.5243, -0.5061,  0.3078],
        [-0.4443, -0.5102,  0.4492],
        [-0.2608, -0.2487, -0.0872],
        [-0.2274, -0.2278, -0.1773],
        [-0.0181, -0.2372, -0.2186]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1750: tensor([[-0.2561, -0.1737, -0.1781],
        [-0.0939, -0.2006, -0.3975],
        [-0.3975, -0.4550,  0.1040],
        [-0.0988, -0.0204, -0.3826],
        [-0.0424, -0.1462, -0.2677],
        [-0.1223, -0.1312,  0.0077],
        [-0.2963, -0.3412,  0.2809],
        [-0.0813, -0.1270, -0.4580],
        [ 0.1169, -0.0126, -0.8338],
        [-0.1672, -0.2670, -0.4183],
        [-0.3372, -0.3416,  0.2243],
        [-0.1501, -0.1794, -0.1304]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1800: tensor([[-0.1633, -0.2061, -0.3124],
        [-0.4143, -0.3508,  0.0696],
        [-0.0063, -0.0868, -0.3636],
        [-0.1315, -0.2885, -0.3903],
        [-0.0343,  0.0372, -0.3988],
        [-0.1858, -0.1707, -0.0948],
        [-0.1529, -0.0260, -0.4146],
        [-0.2048, -0.2417, -0.0762],
        [-0.0343, -0.1822, -0.3487],
        [-0.1433, -0.1432, -0.5462],
        [ 0.0814, -0.0944, -0.5851],
        [-0.0189, -0.1264, -0.3384]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1850: tensor([[ 0.0925,  0.0043, -0.5212],
        [-0.1341, -0.0850, -0.2843],
        [-0.0184,  0.0485, -0.4081],
        [-0.2360, -0.3168,  0.1132],
        [-0.2114, -0.2705, -0.2328],
        [-0.2445, -0.2278, -0.0653],
        [-0.0636, -0.2224, -0.3694],
        [-0.0437, -0.0177, -0.3803],
        [-0.4793, -0.3761,  0.1958],
        [-0.1712, -0.1090, -0.2736],
        [-0.3176, -0.1235,  0.0204],
        [-0.1092, -0.1712, -0.1455]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1900: tensor([[-0.2542,  0.0069, -0.1373],
        [-0.4456, -0.4555,  0.0665],
        [-0.2804, -0.2233, -0.1432],
        [-0.0010, -0.0164, -0.4526],
        [-0.0863, -0.1281, -0.5906],
        [-0.1744, -0.2063, -0.2487],
        [-0.2866, -0.1716, -0.3046],
        [-0.4142, -0.2478, -0.0882],
        [-0.4765, -0.4089,  0.2563],
        [-0.1565, -0.1134, -0.2994],
        [-0.0797, -0.1628, -0.5222],
        [-0.0888, -0.1442,  0.0231]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1950: tensor([[-2.5873e-01, -2.6745e-01, -1.5762e-01],
        [-2.1951e-01, -1.8313e-01, -4.9315e-01],
        [-1.0362e-01, -8.9861e-02, -5.1414e-01],
        [-1.3998e-01, -2.1823e-01, -4.3074e-01],
        [-2.1053e-01, -2.6605e-01, -3.8630e-01],
        [-3.2777e-01, -2.7535e-01, -6.4544e-02],
        [-1.1358e-01, -8.1691e-02, -5.4884e-01],
        [-1.1424e-01, -2.5280e-01, -1.3484e-02],
        [-1.3041e-01, -1.5840e-04, -5.0247e-01],
        [-4.2514e-02,  1.8282e-02, -6.0034e-01],
        [-2.1612e-01, -2.6039e-01, -3.2686e-01],
        [-1.8159e-01, -1.3137e-01, -5.4448e-01]], device='cuda:0',
       grad_fn=<AddmmBackward>)
Iter #2000: tensor([[-0.3072, -0.3163, -0.3196],
        [-0.4329, -0.3343,  0.1616],
        [-0.3879, -0.3205,  0.1944],
        [-0.4130, -0.3634, -0.0560],
        [-0.1837, -0.2255, -0.4669],
        [-0.2111, -0.2460, -0.3381],
        [ 0.0934,  0.0859, -0.8255],
        [-0.1070, -0.1180, -0.2796],
        [-0.2147, -0.2389, -0.2801],
        [-0.0891, -0.1227, -0.3285],
        [-0.3075, -0.2529, -0.0713],
        [ 0.0068, -0.1795, -0.6185]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2050: tensor([[-0.2509, -0.2202, -0.4166],
        [-0.1349, -0.1978, -0.4674],
        [-0.3985, -0.3834,  0.3128],
        [-0.5023, -0.3715,  0.0220],
        [-0.5108, -0.3249, -0.0418],
        [-0.3479, -0.2981,  0.0320],
        [-0.3410, -0.3215, -0.1611],
        [-0.4472, -0.4401, -0.0408],
        [-0.2246, -0.2979, -0.0520],
        [-0.2157, -0.2477, -0.1217],
        [-0.2216, -0.1403, -0.2515],
        [-0.0086, -0.1562, -0.2730]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2100: tensor([[-0.0361, -0.0323, -0.4508],
        [-0.0236, -0.0921, -0.3805],
        [ 0.0324,  0.0698, -0.6969],
        [-0.2079, -0.2209, -0.0430],
        [-0.2891, -0.3157, -0.0475],
        [-0.0740, -0.0169, -0.5565],
        [-0.2443, -0.3261,  0.1024],
        [-0.3458, -0.2455, -0.1340],
        [-0.5695, -0.5788,  0.4260],
        [-0.0991, -0.1784, -0.4443],
        [-0.2617, -0.1677, -0.3847],
        [-0.3185, -0.2219, -0.2448]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2150: tensor([[-5.7888e-01, -5.0595e-01,  1.0034e-01],
        [-2.7137e-01, -4.3035e-01,  1.6294e-01],
        [-3.5817e-01, -3.1481e-01,  6.1707e-02],
        [-2.7743e-01, -2.0550e-01, -1.8991e-01],
        [-7.4099e-02, -4.9043e-02, -3.1205e-01],
        [-3.2655e-01, -3.4064e-01, -1.5653e-01],
        [-1.6030e-01, -2.6000e-01, -2.0337e-01],
        [-2.4502e-01, -2.8339e-01, -3.8286e-02],
        [-6.8358e-02, -5.7633e-02, -4.0809e-01],
        [ 4.6535e-04, -8.5037e-02, -3.5821e-01],
        [-5.3161e-01, -3.6324e-01,  1.6277e-01],
        [-1.7106e-01, -2.9128e-01, -1.6644e-01]], device='cuda:0',
       grad_fn=<AddmmBackward>)
Iter #2200: tensor([[-0.2318, -0.2631, -0.2684],
        [-0.2885, -0.1977, -0.1722],
        [-0.1662, -0.1498, -0.4270],
        [ 0.0991,  0.0085, -0.6989],
        [-0.1788, -0.3531, -0.1619],
        [-0.2300, -0.2578, -0.2925],
        [-0.1889, -0.2077, -0.2553],
        [-0.3966, -0.4527,  0.0483],
        [-0.1250, -0.0639, -0.4012],
        [-0.3679, -0.2764, -0.1075],
        [-0.0735,  0.0812, -0.5223],
        [-0.2482, -0.1924, -0.2836]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2250: tensor([[-0.4855, -0.5129,  0.3168],
        [-0.4817, -0.3558,  0.1805],
        [-0.5843, -0.5224,  0.4733],
        [-0.5424, -0.5158,  0.4296],
        [-0.3697, -0.3294, -0.0281],
        [-0.2126, -0.2762, -0.2976],
        [-0.3771, -0.2640,  0.0902],
        [-0.3859, -0.3436,  0.0578],
        [-0.3968, -0.3358,  0.0362],
        [-0.4877, -0.4116,  0.0427],
        [ 0.0634,  0.0511, -0.8193],
        [ 0.0051, -0.0578, -0.6834]], device='cuda:0', grad_fn=<AddmmBackward>)
