Iter #50: tensor([[ 0.0281, -0.4635,  0.2568],
        [ 0.0178, -0.5776,  0.1647],
        [ 0.0678, -0.5442,  0.1662],
        [-0.0266, -0.5261,  0.0531],
        [ 0.0866, -0.5114,  0.3274],
        [ 0.2555, -0.5033,  0.3652],
        [-0.0786, -0.7647,  0.4747],
        [ 0.0423, -0.5728,  0.2504],
        [-0.0762, -0.7380,  0.6547],
        [ 0.1485, -0.5384,  0.3785],
        [ 0.1209, -0.7451,  0.5840],
        [ 0.2622, -0.4637,  0.4995]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[ 0.0539, -0.6556,  0.3560],
        [ 0.0856, -0.7051,  0.2300],
        [ 0.1170, -0.6920,  0.3225],
        [-0.0628, -0.6494,  0.3886],
        [ 0.0774, -0.7219,  0.7171],
        [ 0.0272, -0.7967,  0.5916],
        [-0.0600, -0.8240,  0.5327],
        [-0.0256, -0.6497,  0.4226],
        [-0.0041, -0.7154,  0.4636],
        [-0.0731, -0.5343,  0.3770],
        [-0.2467, -0.4897,  0.5914],
        [ 0.0662, -0.8635,  0.5869]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.0938, -0.9316,  0.4823],
        [ 0.0341, -0.8534,  0.4555],
        [ 0.0498, -0.8234,  0.5860],
        [-0.0125, -0.7817,  0.4516],
        [ 0.0462, -0.8319,  0.4173],
        [ 0.2526, -0.6442,  0.4414],
        [ 0.2760, -0.7319,  0.4339],
        [ 0.0991, -0.7812,  0.3111],
        [-0.0929, -0.9521,  0.6396],
        [ 0.0592, -0.8036,  0.2500],
        [ 0.2557, -0.7493,  0.3278],
        [ 0.0980, -0.9472,  0.2589]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[ 0.1200, -0.7491,  0.2963],
        [ 0.0953, -0.8613,  0.3174],
        [ 0.3854, -0.7748,  0.4192],
        [ 0.1655, -0.8023,  0.6046],
        [ 0.1119, -0.9675,  0.2932],
        [-0.0192, -1.1462,  0.4886],
        [ 0.3165, -0.7937,  0.3363],
        [ 0.0070, -0.7089,  0.3422],
        [ 0.1440, -0.9114,  0.3511],
        [ 0.1201, -0.9067,  0.5206],
        [ 0.1985, -0.9853,  0.7093],
        [ 0.2876, -0.9152,  0.2786]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.0175, -0.8329,  0.3843],
        [ 0.1096, -0.7647,  0.0268],
        [-0.1067, -0.9948,  0.6032],
        [ 0.2693, -0.6493, -0.0298],
        [ 0.1547, -0.8648,  0.2901],
        [ 0.0322, -0.6906,  0.2425],
        [-0.0809, -0.8328,  0.5899],
        [-0.0146, -0.9638,  0.3868],
        [ 0.2442, -0.7694,  0.1228],
        [ 0.0705, -0.6991,  0.2466],
        [ 0.2075, -0.8532,  0.1686],
        [ 0.0312, -0.8819,  0.2424]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.0272, -0.8773,  0.3572],
        [-0.0173, -0.7509,  0.5776],
        [ 0.1533, -0.6873,  0.0672],
        [ 0.1678, -0.7426,  0.3297],
        [ 0.0457, -0.7457,  0.3644],
        [ 0.2921, -0.6695,  0.0085],
        [ 0.0462, -0.6671,  0.2037],
        [ 0.0623, -0.6946,  0.4577],
        [-0.0076, -0.7293,  0.4227],
        [ 0.0302, -0.5896,  0.0796],
        [ 0.0994, -0.7067,  0.2782],
        [ 0.0031, -0.7579,  0.3513]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[ 0.1122, -0.6216,  0.1480],
        [ 0.1645, -0.7423,  0.2717],
        [ 0.0844, -0.6787,  0.3174],
        [ 0.1239, -0.6927,  0.0533],
        [ 0.2393, -0.5310, -0.1694],
        [ 0.2192, -0.8260, -0.1256],
        [ 0.2175, -0.5477,  0.0918],
        [ 0.2138, -0.7588, -0.0403],
        [ 0.2708, -0.7457, -0.0929],
        [ 0.2074, -0.6592,  0.0741],
        [ 0.4760, -0.6333, -0.0647],
        [ 0.1005, -0.8367,  0.0994]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.0086, -0.6774,  0.0163],
        [ 0.1689, -0.7926,  0.0093],
        [ 0.2589, -0.6497,  0.1681],
        [ 0.1173, -0.5794, -0.0516],
        [ 0.1403, -0.5687,  0.2192],
        [ 0.0618, -0.6924, -0.0203],
        [ 0.2252, -0.6515, -0.0365],
        [ 0.1684, -0.6429,  0.1112],
        [-0.3301, -0.7536,  0.8122],
        [-0.2874, -0.6241,  0.6148],
        [ 0.0698, -0.6105,  0.2462],
        [ 0.2140, -0.7099, -0.2243]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[ 0.1585, -0.4913, -0.2956],
        [ 0.0722, -0.4404,  0.0714],
        [ 0.1697, -0.5673,  0.0491],
        [ 0.2732, -0.4761, -0.0840],
        [-0.0536, -0.6367,  0.1185],
        [ 0.0850, -0.5240, -0.0071],
        [-0.0701, -0.6570,  0.0263],
        [ 0.0376, -0.4476,  0.0863],
        [ 0.2045, -0.6307,  0.0285],
        [-0.3433, -0.6454,  0.3405],
        [ 0.0061, -0.4745,  0.1304],
        [ 0.2454, -0.4667, -0.3301]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[ 0.0058, -0.2081,  0.1789],
        [ 0.1417, -0.5015, -0.0142],
        [ 0.0703, -0.4110, -0.2304],
        [ 0.0613, -0.5300,  0.0186],
        [-0.0166, -0.5186,  0.1136],
        [-0.3067, -0.5144,  0.2224],
        [ 0.1456, -0.3228, -0.1588],
        [-0.2323, -0.5066,  0.3771],
        [-0.0951, -0.6002,  0.1242],
        [ 0.0274, -0.6443, -0.0172],
        [ 0.0095, -0.2293, -0.0922],
        [ 0.3403, -0.3994, -0.2161]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.1889, -0.5617,  0.2011],
        [-0.0254, -0.4813, -0.1128],
        [ 0.2154, -0.3704,  0.0983],
        [ 0.0656, -0.4854, -0.2237],
        [-0.0291, -0.4951, -0.0799],
        [ 0.1458, -0.3959,  0.0727],
        [ 0.1177, -0.3597, -0.1074],
        [ 0.2986, -0.4637,  0.0057],
        [-0.0815, -0.5944,  0.0654],
        [ 0.1871, -0.5360,  0.0293],
        [-0.0350, -0.4052,  0.1343],
        [-0.1428, -0.4991,  0.0940]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #600: tensor([[ 0.0389, -0.3292,  0.0158],
        [-0.0574, -0.5767,  0.2668],
        [-0.1432, -0.5366,  0.1843],
        [ 0.0064, -0.5224, -0.0669],
        [ 0.0635, -0.4341, -0.0501],
        [ 0.1436, -0.3101, -0.2674],
        [ 0.1941, -0.4403, -0.0097],
        [-0.2012, -0.3282,  0.1706],
        [-0.0111, -0.4062,  0.0282],
        [-0.1019, -0.3141, -0.1295],
        [-0.1999, -0.6535,  0.0258],
        [ 0.2800, -0.4449, -0.0846]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #650: tensor([[-0.2844, -0.4333,  0.3303],
        [-0.0430, -0.3928,  0.0795],
        [-0.4935, -0.2936,  0.4903],
        [ 0.1921, -0.3179, -0.0530],
        [-0.0475, -0.3737, -0.2093],
        [ 0.1951, -0.2963, -0.2520],
        [ 0.2466, -0.3885, -0.3649],
        [ 0.2876, -0.2237, -0.0915],
        [-0.1541, -0.4482,  0.2511],
        [ 0.0790, -0.3419, -0.3125],
        [-0.2393, -0.5023, -0.0138],
        [ 0.0574, -0.1944,  0.0280]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #700: tensor([[ 0.1403, -0.3585, -0.3765],
        [-0.2361, -0.4459, -0.0047],
        [-0.0030, -0.4783, -0.1006],
        [ 0.0202, -0.2925, -0.1591],
        [ 0.0641, -0.4109, -0.0135],
        [-0.0560, -0.2295,  0.0173],
        [ 0.0124, -0.4180,  0.1301],
        [-0.7855, -0.5085,  0.7338],
        [-0.2021, -0.3457,  0.0320],
        [ 0.0457, -0.1462, -0.2161],
        [ 0.2293, -0.3501, -0.4538],
        [-0.1511, -0.4005, -0.2143]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #750: tensor([[ 0.0135, -0.2946, -0.0299],
        [-0.1027, -0.3740, -0.0643],
        [-0.3660, -0.4940,  0.4156],
        [ 0.2717, -0.3368, -0.2779],
        [-0.2714, -0.3190,  0.2345],
        [-0.1341, -0.2567,  0.0961],
        [ 0.1250, -0.3765, -0.2887],
        [-0.0016, -0.3304, -0.2096],
        [-0.1549, -0.3890,  0.1767],
        [-0.0890, -0.3300, -0.1374],
        [-0.1694, -0.2897, -0.3816],
        [ 0.2622, -0.2807, -0.3883]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #800: tensor([[-5.8491e-01, -3.8522e-01,  7.2382e-01],
        [-9.0037e-02, -3.3804e-01, -1.1607e-01],
        [-3.6366e-01, -2.0460e-01,  1.4429e-01],
        [-4.2135e-01, -3.2105e-01,  4.5465e-01],
        [-1.4642e-01, -2.9847e-01, -1.1384e-02],
        [-3.3416e-01, -3.9859e-01,  5.5125e-02],
        [-4.5822e-01, -2.4537e-01,  1.8321e-01],
        [-3.2183e-01, -3.4898e-01, -1.6198e-01],
        [ 4.4081e-02, -3.0595e-01, -1.6750e-01],
        [ 1.4071e-02, -2.7574e-01, -1.1660e-01],
        [ 1.1384e-01, -4.7186e-01,  5.0532e-04],
        [-2.9796e-01, -3.0359e-01,  2.2950e-01]], device='cuda:0',
       grad_fn=<AddmmBackward>)
Iter #850: tensor([[ 0.0373, -0.3181, -0.3450],
        [ 0.0914, -0.1298, -0.3426],
        [-0.1851, -0.1884,  0.0477],
        [ 0.0272, -0.1040, -0.3059],
        [-0.1226, -0.3604, -0.0604],
        [ 0.2716, -0.1458, -0.5174],
        [-0.7399, -0.4984,  0.6567],
        [ 0.1101, -0.1752, -0.4289],
        [-0.7068, -0.4330,  0.7892],
        [-0.6884, -0.4539,  0.6636],
        [-0.8818, -0.4562,  0.8088],
        [ 0.1831, -0.0913, -0.4448]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #900: tensor([[-3.3827e-01, -2.2522e-01,  1.6476e-01],
        [-5.8041e-01, -3.1904e-01,  3.2510e-01],
        [-4.4709e-01, -2.8290e-01,  1.7764e-01],
        [-4.6099e-01, -3.5646e-01,  1.6067e-01],
        [-5.4898e-01, -4.8927e-01,  4.7207e-01],
        [-4.7679e-02, -2.8149e-02, -1.2184e-01],
        [-4.7952e-01, -3.3179e-01,  2.0840e-01],
        [-3.5155e-01, -3.3141e-01,  2.3114e-02],
        [-3.5421e-01, -2.6269e-01,  3.0823e-01],
        [-1.9726e-02, -1.5458e-01, -1.5893e-01],
        [-6.8574e-02, -2.4254e-01, -5.0146e-03],
        [-4.9129e-01, -2.1187e-01,  4.5314e-04]], device='cuda:0',
       grad_fn=<AddmmBackward>)
Iter #950: tensor([[-0.2407, -0.2923, -0.1470],
        [-0.4116, -0.2858,  0.3458],
        [ 0.2036, -0.1867, -0.0719],
        [-0.0824, -0.1472, -0.1084],
        [-0.6245, -0.4696,  0.8226],
        [-0.2317, -0.2386,  0.0303],
        [-0.3252, -0.0612, -0.0937],
        [-0.5429, -0.3865,  0.2007],
        [-0.1993, -0.2683,  0.0307],
        [-0.2382, -0.1526, -0.0987],
        [-0.2355, -0.1914, -0.0547],
        [-0.9872, -0.4914,  0.8857]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1000: tensor([[-0.3584, -0.3138,  0.0846],
        [-0.1899, -0.1058,  0.0118],
        [-0.1045,  0.0323, -0.6346],
        [-0.3054, -0.1631, -0.2811],
        [-0.4482, -0.3601,  0.1738],
        [ 0.0354, -0.0614, -0.4459],
        [-0.3796, -0.3013,  0.1591],
        [-0.1692,  0.0138, -0.3020],
        [-0.1509, -0.1202, -0.0306],
        [-0.2875, -0.1833, -0.1073],
        [-0.3060, -0.1714,  0.1722],
        [-0.2536, -0.2932, -0.0049]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1050: tensor([[-0.2793, -0.2099,  0.1626],
        [-0.3147, -0.2958,  0.4410],
        [-0.2161, -0.1615,  0.0088],
        [-0.3586, -0.3522,  0.4915],
        [-0.0330, -0.0422, -0.1415],
        [-0.7288, -0.5517,  0.6245],
        [-0.2740, -0.2634, -0.2325],
        [-0.3236, -0.1404, -0.0152],
        [-0.1380, -0.0059,  0.2057],
        [-0.2317, -0.0719,  0.1380],
        [-0.3122, -0.2212, -0.1400],
        [-0.3801, -0.2894,  0.0859]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1100: tensor([[-0.5671, -0.3146,  0.5094],
        [-0.2208, -0.1496, -0.2175],
        [-0.0933, -0.1691,  0.0042],
        [-0.5477, -0.3743,  0.3281],
        [-0.6208, -0.2125,  0.3947],
        [-0.1912, -0.2304, -0.0230],
        [-0.4330, -0.2854,  0.3038],
        [-0.4669, -0.1865,  0.0852],
        [-0.7313, -0.3477,  0.4114],
        [-0.5376, -0.4107,  0.4564],
        [-0.3202, -0.1927,  0.1446],
        [-0.4499, -0.0826, -0.1186]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1150: tensor([[-0.6225, -0.4373,  1.0440],
        [-0.5423, -0.1516,  0.0906],
        [-0.4219, -0.2470, -0.0128],
        [-0.1522, -0.1765, -0.0220],
        [-0.3423, -0.1858, -0.0483],
        [ 0.0587, -0.0091, -0.2434],
        [-0.3904, -0.1456, -0.1987],
        [-0.2775, -0.0325, -0.2252],
        [-0.4446, -0.3774,  0.2556],
        [-0.1709, -0.2799, -0.2116],
        [-0.1265, -0.1106, -0.1571],
        [-0.3812, -0.3607, -0.1425]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1200: tensor([[ 0.1653,  0.1538, -0.4945],
        [-0.2312, -0.1000, -0.0773],
        [-0.3393, -0.1564, -0.0133],
        [-0.2950, -0.0696, -0.0092],
        [-0.3783, -0.1805, -0.0155],
        [-0.2928, -0.1196,  0.1019],
        [-0.1303,  0.0289, -0.2794],
        [-0.5783, -0.3768,  0.2321],
        [-0.3557, -0.1808, -0.0449],
        [-0.0195,  0.0218, -0.4800],
        [-0.3144,  0.0164, -0.1043],
        [-0.7263, -0.5304,  0.8754]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1250: tensor([[ 0.0432,  0.1466, -0.6779],
        [-0.7940, -0.7740,  1.1351],
        [-0.2909, -0.1600, -0.0303],
        [-0.4882, -0.0847,  0.1321],
        [-0.1514,  0.0016, -0.2785],
        [-0.2486, -0.0512,  0.3425],
        [-0.2107, -0.0316,  0.0201],
        [-0.3955, -0.2460,  0.4111],
        [-0.3942, -0.1618,  0.1042],
        [-0.2557, -0.1393,  0.0836],
        [-0.3047, -0.1304,  0.0082],
        [-0.2006, -0.1193, -0.2721]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1300: tensor([[-0.0665,  0.0030, -0.5770],
        [-0.2649, -0.0032, -0.2702],
        [ 0.0317,  0.1484, -0.5403],
        [-0.3300,  0.0230, -0.1154],
        [-0.4123, -0.2082,  0.1663],
        [-0.3724, -0.2726, -0.0037],
        [-0.6293, -0.4371,  0.3013],
        [-0.0340,  0.0665, -0.4647],
        [-0.2263, -0.0378,  0.0931],
        [-0.1408, -0.0094, -0.4246],
        [-0.4675, -0.1283,  0.0749],
        [-0.4871, -0.2981,  0.1492]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1350: tensor([[-0.1105,  0.0867, -0.1821],
        [-0.4246, -0.3721,  0.2730],
        [-0.5005, -0.3106, -0.0725],
        [-0.0040,  0.1988, -0.4960],
        [-0.4109, -0.4611,  0.2316],
        [-0.4725, -0.4568,  0.4977],
        [-0.1633, -0.0467,  0.0599],
        [-0.3515, -0.2166, -0.0458],
        [-0.1581, -0.0212, -0.4577],
        [-0.1655,  0.1446, -0.4177],
        [-0.2451, -0.1805, -0.0063],
        [-0.4850, -0.3615,  0.0481]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1400: tensor([[-0.3610, -0.4316,  0.3643],
        [-0.2701, -0.1750,  0.1172],
        [-0.1737,  0.0780, -0.0831],
        [-0.3439, -0.2092, -0.0885],
        [-0.2740, -0.1796,  0.2597],
        [-0.3429, -0.0879, -0.1416],
        [ 0.0049,  0.0686, -0.3589],
        [-0.1057,  0.1902, -0.4379],
        [-0.0637,  0.2463, -0.4195],
        [-0.1765, -0.0240, -0.1779],
        [-0.2982, -0.1098, -0.3256],
        [-0.3949, -0.3811,  0.4395]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1450: tensor([[-1.3689e-01,  1.0369e-01, -3.7943e-01],
        [ 1.7917e-02,  2.7765e-02, -4.7217e-01],
        [ 9.8543e-05,  2.6406e-01, -5.6281e-01],
        [-1.7224e-01, -5.1258e-03, -4.7549e-01],
        [-2.6907e-01, -7.8141e-02, -3.9633e-01],
        [-2.2982e-01, -1.4476e-01, -3.3772e-01],
        [ 2.0752e-02, -6.1854e-02, -5.6180e-01],
        [-1.1742e-01,  6.6506e-02, -5.3058e-01],
        [-1.9352e-01,  2.2952e-02, -8.5427e-02],
        [-2.6135e-01,  4.6106e-02, -1.8945e-01],
        [-2.6267e-01, -9.0423e-02,  1.0956e-02],
        [ 7.0774e-03, -1.5207e-02, -2.2917e-01]], device='cuda:0',
       grad_fn=<AddmmBackward>)
Iter #1500: tensor([[-0.4019, -0.1263,  0.0341],
        [-0.7569, -0.6349,  1.0287],
        [-0.2366, -0.2514, -0.1943],
        [-0.0563,  0.0751, -0.3302],
        [-0.0340, -0.1188, -0.3895],
        [-0.1783,  0.1447, -0.4381],
        [ 0.0141,  0.1444, -0.4217],
        [-0.0365, -0.0121, -0.2431],
        [-0.3485, -0.1583, -0.0621],
        [-0.2353, -0.2667, -0.0957],
        [-0.1360,  0.1326, -0.2577],
        [-0.2839, -0.3608,  0.1303]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1550: tensor([[-0.1217, -0.1514,  0.1256],
        [-0.1306,  0.1016, -0.2296],
        [-0.2966, -0.2011,  0.0737],
        [-0.0902, -0.0451, -0.5306],
        [-0.1077,  0.1025, -0.2676],
        [-0.2429, -0.0917,  0.1620],
        [-0.1544, -0.0784, -0.0394],
        [-0.5476, -0.5277,  0.7220],
        [-0.3726, -0.4229,  0.4094],
        [-0.2949, -0.3816,  0.3040],
        [ 0.0620,  0.2250, -0.5881],
        [-0.1258, -0.1368,  0.0950]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1600: tensor([[-0.2557, -0.0862, -0.2275],
        [-0.0835,  0.0976, -0.3457],
        [-0.1862, -0.1359, -0.4752],
        [ 0.0091, -0.0052, -0.2619],
        [-0.2210, -0.1293, -0.3246],
        [-0.1113,  0.0098,  0.0613],
        [-0.0612,  0.0985, -0.0580],
        [ 0.0191,  0.0972, -0.2517],
        [-0.0399, -0.0579, -0.3544],
        [-0.0279,  0.0635, -0.4534],
        [-0.2444,  0.0669, -0.3921],
        [-0.0944,  0.0455, -0.3504]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1650: tensor([[-0.0956,  0.1151, -0.1318],
        [-0.1913, -0.3137,  0.2825],
        [-0.3284, -0.3918,  0.2488],
        [-0.2287, -0.2034,  0.2028],
        [-0.2404, -0.3030,  0.1368],
        [-0.1666, -0.0494,  0.0293],
        [-0.4556, -0.3983,  0.5145],
        [-0.1817, -0.1991,  0.0614],
        [-0.0844, -0.1800, -0.0251],
        [-0.1071, -0.0929, -0.1607],
        [-0.2086, -0.2562,  0.1642],
        [-0.1477,  0.0619, -0.2306]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1700: tensor([[ 0.1160,  0.0080, -0.2466],
        [-0.2921, -0.1327, -0.1062],
        [-0.3837, -0.2510,  0.2276],
        [-0.1275, -0.1173, -0.1691],
        [-0.4613, -0.4713,  0.4852],
        [-0.2731, -0.3124, -0.0101],
        [-0.1513, -0.0608, -0.1761],
        [ 0.0723,  0.1634, -0.2072],
        [-0.3719, -0.4115,  0.2842],
        [-0.2198, -0.2717,  0.1582],
        [-0.0296,  0.0085, -0.3967],
        [-0.3627, -0.4027,  0.3479]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1750: tensor([[-0.2577, -0.1863,  0.2449],
        [-0.2146, -0.2639,  0.1873],
        [-0.1455, -0.1938, -0.0481],
        [-0.2025, -0.2555,  0.1631],
        [-0.1071,  0.0705,  0.0051],
        [-0.2835, -0.1663, -0.1280],
        [-0.2836, -0.0863, -0.0471],
        [-0.0810,  0.0032, -0.2443],
        [-0.2874, -0.3035,  0.0876],
        [-0.1598, -0.1158, -0.0268],
        [-0.2184, -0.4400,  0.1559],
        [-0.2246, -0.0394, -0.5326]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1800: tensor([[-0.1185, -0.1396,  0.0081],
        [-0.1069, -0.0525, -0.1785],
        [-0.0894, -0.2055, -0.2153],
        [-0.1728,  0.0120, -0.3737],
        [-0.4248, -0.4695,  0.4487],
        [-0.1188,  0.0579, -0.0546],
        [-0.0611, -0.0499, -0.2218],
        [ 0.0343,  0.1123, -0.4694],
        [-0.6829, -0.6874,  0.9311],
        [-0.1167, -0.0784, -0.4982],
        [-0.1843, -0.1697, -0.1446],
        [-0.3174, -0.1671, -0.0251]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1850: tensor([[-0.0599, -0.1664, -0.0624],
        [ 0.1130,  0.1861, -0.5475],
        [-0.3786, -0.5701,  0.5073],
        [-0.4606, -0.1977,  0.1089],
        [-0.3888, -0.4614,  0.5454],
        [-0.1150, -0.0881, -0.2335],
        [-0.1303, -0.1895,  0.0294],
        [-0.2967, -0.2831,  0.3000],
        [-0.1275, -0.1749,  0.0174],
        [-0.0568, -0.0921, -0.1570],
        [-0.0443,  0.2750, -0.6250],
        [-0.2729, -0.3727,  0.4585]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1900: tensor([[-0.2974, -0.2153,  0.1512],
        [-0.4593, -0.7774,  1.2744],
        [ 0.0425, -0.0081, -0.1735],
        [ 0.2361,  0.1784, -0.4226],
        [-0.0269, -0.0315, -0.1255],
        [-0.3683, -0.4510,  0.4404],
        [ 0.1329,  0.0880, -0.4734],
        [-0.0480,  0.0722, -0.4513],
        [ 0.1337,  0.2580, -0.3116],
        [-0.1531,  0.0672, -0.4814],
        [-0.1276, -0.2041,  0.1539],
        [ 0.0273, -0.0361, -0.4091]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1950: tensor([[-0.0819, -0.0677, -0.1442],
        [-0.4128, -0.5233,  0.3261],
        [-0.0079,  0.1067, -0.1947],
        [-0.0735, -0.0093, -0.2415],
        [-0.1567, -0.1901, -0.1071],
        [-0.0511, -0.0230, -0.2878],
        [ 0.0167, -0.1706,  0.1427],
        [-0.1209, -0.0017, -0.2207],
        [-0.1516, -0.1398, -0.2633],
        [-0.3833, -0.2194,  0.0818],
        [ 0.1358,  0.0213, -0.3110],
        [-0.0397,  0.0320, -0.3284]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2000: tensor([[-0.2609, -0.3978, -0.0389],
        [ 0.0800, -0.1158, -0.1791],
        [-0.0223, -0.0594, -0.2621],
        [-0.2195, -0.1391, -0.0482],
        [-0.1614, -0.3449,  0.1642],
        [-0.1084, -0.1222, -0.0598],
        [-0.1277, -0.0961, -0.3191],
        [ 0.0956,  0.0440, -0.0767],
        [-0.1532, -0.2546,  0.0503],
        [ 0.1597,  0.0415, -0.1733],
        [-0.0525,  0.0344, -0.4174],
        [-0.0259, -0.1551, -0.3308]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2050: tensor([[-0.0360, -0.1313, -0.2297],
        [-0.1596, -0.1210, -0.4380],
        [-0.2532, -0.3218,  0.1352],
        [-0.2546, -0.1747, -0.0214],
        [-0.1187, -0.2826, -0.0080],
        [-0.2998, -0.3083,  0.3254],
        [-0.3206, -0.2002, -0.3537],
        [-0.4803, -0.6774,  1.1599],
        [-0.2903, -0.3629, -0.0152],
        [-0.2886, -0.2678, -0.0152],
        [-0.2788, -0.2564, -0.2578],
        [-0.2138, -0.3275, -0.2426]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2100: tensor([[ 0.1178,  0.0797, -0.6616],
        [-0.1567, -0.1808,  0.0278],
        [-0.0677, -0.1832, -0.0857],
        [-0.2776, -0.5456,  0.5847],
        [-0.0487, -0.0687, -0.1953],
        [-0.4716, -0.4702,  0.4454],
        [-0.2303, -0.2807,  0.1784],
        [-0.0046,  0.0040, -0.3335],
        [-0.0697, -0.1900,  0.0752],
        [-0.2673, -0.2231,  0.0866],
        [-0.1064, -0.0473, -0.4399],
        [-0.0333, -0.2210, -0.1301]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2150: tensor([[-0.4296, -0.5049,  0.0919],
        [-0.0964, -0.0314, -0.4145],
        [-0.1467, -0.3615, -0.0171],
        [-0.5392, -0.4828,  0.3784],
        [ 0.0331, -0.1859, -0.1419],
        [-0.1168, -0.1349, -0.2290],
        [ 0.0467, -0.0432, -0.2219],
        [-0.0562, -0.0541, -0.1519],
        [-0.1027, -0.2015, -0.2544],
        [ 0.1590,  0.0746, -0.2705],
        [-0.2350, -0.2846,  0.1637],
        [-0.6741, -0.7645,  1.0102]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2200: tensor([[ 0.0154,  0.0660, -0.3132],
        [-0.5851, -0.5552,  0.6974],
        [-0.3625, -0.2096,  0.0238],
        [-0.1263, -0.1683, -0.2201],
        [-0.1628, -0.1140, -0.4961],
        [ 0.0630,  0.0389, -0.1640],
        [-0.0719, -0.1884, -0.0775],
        [-0.2420, -0.3219, -0.0424],
        [-0.1433, -0.1186, -0.5334],
        [-0.0277, -0.1486, -0.0355],
        [-0.0607, -0.2195, -0.1082],
        [-0.1588, -0.1959, -0.0359]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2250: tensor([[-0.1089, -0.0996, -0.3144],
        [ 0.0722, -0.0396, -0.6459],
        [ 0.0840, -0.0461, -0.0585],
        [-0.0573,  0.0330, -0.2958],
        [ 0.0918,  0.0654, -0.5589],
        [-0.3087, -0.2195, -0.3330],
        [ 0.1788,  0.1820, -0.4119],
        [-0.0646, -0.1134, -0.2550],
        [ 0.0026,  0.0178, -0.7992],
        [-0.0814, -0.1837, -0.0865],
        [ 0.0370,  0.0638, -0.4227],
        [ 0.0035,  0.1727, -0.6122]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2300: tensor([[-0.1624, -0.1197, -0.1761],
        [ 0.0458,  0.0388, -0.5375],
        [-0.3765, -0.4904,  0.1058],
        [-0.3483, -0.2787, -0.2976],
        [-0.3215, -0.4173,  0.0222],
        [-0.1159, -0.0526, -0.1049],
        [-0.2476, -0.3593,  0.3420],
        [ 0.0411, -0.2060,  0.1067],
        [-0.0096, -0.1952,  0.0073],
        [-0.3278, -0.2318,  0.1899],
        [-0.4746, -0.4938,  0.5041],
        [-0.1330, -0.0693, -0.1674]], device='cuda:0', grad_fn=<AddmmBackward>)
