Iter #50: tensor([[-0.3497,  0.4774,  0.1986],
        [ 0.0309,  0.2707,  0.1900],
        [ 0.0207,  0.2948,  0.3999],
        [-0.2540,  0.4082,  0.1358],
        [-0.0009,  0.2101,  0.0114],
        [ 0.1583,  0.2201,  0.2340],
        [ 0.1167,  0.3014,  0.3971],
        [-0.0277,  0.3602,  0.0612],
        [-0.1605,  0.3437,  0.1152],
        [ 0.0341,  0.0519,  0.0473],
        [-0.4401,  0.2051,  0.0191],
        [-0.0573,  0.6291, -0.0345]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #100: tensor([[-0.2623,  0.5262,  0.4046],
        [-0.2467,  0.2571,  0.0864],
        [-0.3248,  0.5454,  0.0234],
        [-0.1884,  0.5111,  0.1867],
        [-0.2982,  0.4396,  0.1702],
        [-0.4154,  0.7532, -0.0237],
        [-0.3385,  0.6300,  0.1472],
        [-0.1599,  0.4074,  0.2768],
        [-0.0286,  0.4876,  0.5005],
        [-0.0881,  0.8351, -0.0069],
        [-0.2062,  0.7961,  0.1122],
        [-0.2280,  0.5348,  0.1577]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #150: tensor([[-0.5489,  0.7107,  0.3032],
        [-0.3746,  0.7073,  0.3550],
        [-0.2940,  0.7299,  0.2155],
        [-0.4957,  0.4588,  0.2792],
        [-0.1966,  0.5114,  0.2905],
        [-0.3290,  0.6664,  0.3365],
        [-0.3214,  0.7623,  0.1643],
        [-0.5738,  0.8698,  0.2023],
        [-0.4206,  0.7489,  0.2270],
        [-0.4358,  0.5756,  0.2830],
        [-0.3657,  0.4023,  0.2897],
        [-0.5737,  0.4735,  0.2730]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #200: tensor([[-0.8050,  1.0051,  0.1362],
        [-0.6795,  0.8923,  0.1386],
        [-0.7653,  0.9415,  0.0956],
        [-0.9182,  0.7919,  0.1326],
        [-0.6306,  0.8675,  0.2786],
        [-0.6581,  0.9456, -0.0150],
        [-0.3029,  0.7861,  0.2304],
        [-0.5682,  0.5773,  0.3500],
        [-0.6404,  0.6716,  0.2050],
        [-0.5315,  0.7747,  0.2238],
        [-0.7309,  0.9215,  0.1231],
        [-0.7118,  0.8903, -0.0197]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #250: tensor([[-0.6136,  0.8764,  0.1972],
        [-0.6558,  0.7068,  0.1734],
        [-0.6008,  0.7956,  0.4185],
        [-0.5356,  0.8937,  0.2999],
        [-0.5685,  0.6405,  0.4752],
        [-0.6538,  1.0262, -0.0049],
        [-0.7231,  0.9363,  0.0588],
        [-0.6495,  0.9654, -0.0986],
        [-0.8301,  1.0937,  0.1094],
        [-0.6192,  0.8896,  0.0449],
        [-0.5200,  0.3818,  0.4844],
        [-0.3608,  0.6376,  0.1306]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #300: tensor([[-0.6321,  0.8124,  0.1794],
        [-0.6873,  1.0241, -0.0868],
        [-0.3599,  0.3791,  0.3269],
        [-0.5840,  0.5337,  0.5794],
        [-0.3993,  0.5381,  0.3017],
        [-0.7906,  0.7770,  0.2128],
        [-0.6126,  0.4269,  0.2118],
        [-0.7529,  0.6741,  0.1537],
        [-0.5599,  0.3675,  0.4647],
        [-0.7211,  0.6409,  0.5225],
        [-0.4745,  0.5747,  0.1681],
        [-0.6260,  0.9243,  0.1961]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #350: tensor([[-0.5282,  0.6982,  0.2711],
        [-0.5488,  0.6960,  0.1803],
        [-0.6837,  0.9721,  0.1617],
        [-0.7126,  0.7009, -0.0238],
        [-0.6185,  0.6279,  0.3406],
        [-0.5911,  0.7316,  0.3758],
        [-0.6667,  0.9882,  0.1483],
        [-0.6178,  0.6846,  0.3150],
        [-0.7176,  0.6382,  0.4886],
        [-0.6260,  0.5882,  0.1551],
        [-0.5983,  0.8582,  0.2695],
        [-0.6628,  0.6956,  0.3336]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #400: tensor([[-0.4926,  0.4966,  0.3529],
        [-0.6354,  0.7926,  0.2290],
        [-0.6357,  0.8714,  0.2283],
        [-0.2126, -0.1498,  0.6326],
        [-0.3152, -0.2659,  0.8686],
        [-0.2190, -0.0741,  0.8094],
        [-0.1570, -0.3175,  1.1491],
        [-0.1430, -0.3010,  1.0290],
        [-0.2556, -0.4572,  0.7834],
        [-0.5667,  0.7906,  0.3018],
        [-0.8941,  0.7062,  0.1613],
        [-0.7024,  0.8614,  0.3493]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #450: tensor([[-0.6632,  0.8712,  0.1723],
        [-0.5024,  0.4840,  0.2873],
        [-0.5195,  0.5122,  0.2236],
        [-0.5449,  0.5652,  0.1513],
        [-0.4504,  0.8303,  0.0792],
        [-0.5471,  0.9638, -0.0544],
        [-0.5508,  0.9023, -0.0089],
        [-0.6646,  0.5653,  0.2454],
        [-0.6408,  0.5178,  0.3577],
        [-0.5867,  0.7781, -0.0604],
        [-0.5006,  0.4407,  0.3086],
        [-0.7203,  0.5402,  0.2944]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #500: tensor([[-0.6025,  0.6249,  0.2877],
        [-0.3581,  0.7250,  0.1110],
        [-0.5833,  0.7794,  0.2304],
        [-0.3616,  0.4371,  0.3535],
        [-0.6034,  0.7662,  0.3164],
        [-0.5633,  0.4128,  0.1417],
        [-0.7006,  0.7715,  0.2206],
        [-0.5337,  0.7417,  0.0321],
        [-0.7297,  0.9032,  0.2268],
        [-0.2912, -0.2924,  0.4382],
        [-0.6471,  0.4559,  0.3667],
        [-0.5154,  0.5860,  0.1664]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #550: tensor([[-0.3045,  0.4125,  0.3808],
        [-0.3998,  0.4511,  0.2993],
        [-0.2925, -0.0876,  0.5139],
        [-0.4932, -0.0215,  0.6326],
        [-0.2491,  0.1052,  0.6871],
        [-0.6592,  0.3861,  0.2159],
        [-0.7287,  0.7027,  0.2464],
        [-0.5321,  0.7297,  0.3582],
        [-0.5311,  0.3257,  0.4297],
        [-0.3895,  0.0504,  0.6718],
        [-0.5237,  0.7738,  0.2658],
        [-0.6310,  0.6225,  0.3902]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #600: tensor([[-0.1467, -0.1826,  0.9047],
        [-0.6101,  0.3750,  0.3749],
        [-0.6770,  0.7008,  0.1822],
        [-0.4683,  0.2015,  0.6944],
        [-0.2602, -0.2371,  0.8849],
        [-0.2664,  0.3175,  0.5543],
        [-0.4691,  0.2727,  0.5627],
        [-0.2692,  0.2523,  0.5052],
        [-0.1607, -0.1362,  0.8972],
        [-0.2515,  0.5157,  0.0732],
        [-0.2265, -0.3060,  0.8424],
        [-0.4083,  0.0762,  0.5958]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #650: tensor([[-0.2961,  0.4893,  0.2180],
        [-0.4884,  0.5898,  0.1054],
        [-0.4552,  0.6231,  0.1310],
        [-0.4864,  0.6064,  0.2165],
        [-0.2973, -0.0375,  0.6701],
        [-0.1492, -0.4638,  1.0241],
        [-0.2432,  0.2501,  0.8503],
        [-0.3551,  0.1370,  0.4717],
        [-0.3301,  0.0797,  0.6518],
        [-0.3789,  0.2567,  0.4953],
        [-0.3674,  0.6252,  0.0338],
        [-0.3767,  0.4253,  0.3624]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #700: tensor([[-0.4699,  0.2409,  0.2851],
        [-0.3347,  0.3516,  0.2999],
        [-0.2991,  0.2405,  0.3229],
        [-0.3588,  0.7991, -0.0890],
        [-0.4192,  0.4674,  0.3685],
        [-0.3705,  0.5009,  0.0917],
        [-0.2563,  0.0320,  0.4254],
        [-0.3350,  0.0337,  0.4137],
        [-0.3452,  0.2046,  0.2862],
        [-0.3902,  0.4349,  0.3450],
        [-0.2822,  0.3577,  0.3720],
        [-0.1959, -0.1992,  0.8582]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #750: tensor([[ 0.0079, -0.8589,  1.1661],
        [-0.1413, -0.4546,  0.9171],
        [ 0.0284, -0.6222,  1.1418],
        [-0.5108,  0.2118,  0.2888],
        [-0.3531,  0.0447,  0.4788],
        [-0.3212,  0.0080,  0.4633],
        [-0.3050,  0.3846,  0.1219],
        [-0.3744,  0.4950,  0.1439],
        [-0.1778,  0.2611,  0.4401],
        [-0.5807,  0.1798,  0.3855],
        [-0.0456, -0.1991,  0.8102],
        [-0.2813,  0.3889,  0.2699]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #800: tensor([[-0.4023,  0.5382,  0.0296],
        [-0.5345,  0.4191,  0.0582],
        [-0.3953,  0.5267,  0.1843],
        [-0.4712,  0.8358, -0.0468],
        [-0.4973,  0.6805,  0.1510],
        [-0.5249,  0.7027,  0.0662],
        [-0.5181,  0.5833, -0.1042],
        [-0.3772,  0.2309, -0.0895],
        [-0.2409,  0.1950,  0.2853],
        [-0.4462,  0.5387,  0.1559],
        [-0.1761,  0.0885,  0.5811],
        [-0.2156,  0.1806,  0.4548]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #850: tensor([[-0.2644,  0.1739,  0.3370],
        [-0.1965,  0.4155,  0.3024],
        [-0.3947,  0.7768, -0.1947],
        [-0.3423,  0.4953,  0.0634],
        [-0.3001,  0.1697,  0.3613],
        [-0.3546,  0.2713,  0.2423],
        [-0.2634,  0.6823,  0.1360],
        [-0.2684, -0.0156,  0.3652],
        [-0.1976, -0.0743,  0.3550],
        [-0.2309, -0.2081,  0.8431],
        [-0.1543, -0.0580,  0.3904],
        [-0.2087,  0.2522,  0.3727]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #900: tensor([[-0.3212,  0.6399, -0.2039],
        [-0.1802,  0.2680,  0.1480],
        [-0.2045,  0.4115,  0.1660],
        [-0.1548,  0.0858,  0.4446],
        [-0.4326,  0.3549,  0.1276],
        [-0.1177,  0.3568, -0.0095],
        [-0.3639,  0.5642, -0.0840],
        [-0.1807,  0.4864,  0.1367],
        [-0.1561,  0.3550,  0.1541],
        [-0.4716,  0.2879, -0.0651],
        [-0.2331,  0.3772,  0.1254],
        [-0.3095, -0.1875,  0.4255]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #950: tensor([[-0.2495,  0.2711,  0.2019],
        [-0.3588,  0.2541,  0.2941],
        [-0.3487,  0.4213, -0.0839],
        [-0.4098,  0.4796, -0.1125],
        [-0.3921,  0.0770,  0.3630],
        [-0.1466, -0.0760,  0.4224],
        [-0.3920,  0.3339,  0.0920],
        [-0.2711,  0.6989, -0.1741],
        [-0.1570,  0.4629,  0.1219],
        [ 0.0632, -0.0608,  0.2870],
        [-0.1988,  0.3699, -0.1311],
        [-0.3687,  0.4808,  0.2828]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1000: tensor([[-0.3220,  0.3994,  0.0697],
        [-0.3379,  0.0835,  0.1819],
        [-0.2373,  0.7608, -0.1441],
        [-0.2613,  0.3474,  0.1774],
        [-0.3445,  0.4891, -0.2740],
        [-0.1574,  0.2944, -0.0784],
        [-0.1982,  0.4675, -0.0779],
        [-0.2629,  0.1826,  0.2908],
        [-0.3613,  0.4482, -0.1150],
        [-0.1267,  0.4758,  0.3669],
        [-0.2318,  0.5116, -0.0381],
        [-0.1549, -0.0263,  0.3873]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1050: tensor([[-0.2628,  0.3030, -0.0145],
        [ 0.0683,  0.1321,  0.2214],
        [-0.1007,  0.2664, -0.0139],
        [-0.2297, -0.0287,  0.3770],
        [ 0.1289, -0.5821,  0.8722],
        [-0.0047, -0.8461,  1.0322],
        [-0.0796, -0.6202,  0.8678],
        [-0.0161, -0.4371,  0.6161],
        [ 0.0464, -0.1571,  0.4796],
        [-0.2264,  0.0655,  0.4004],
        [-0.1392,  0.1682,  0.3600],
        [-0.2419,  0.7750, -0.3904]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1100: tensor([[-0.1308, -0.0354,  0.3472],
        [-0.0813,  0.0863,  0.2599],
        [-0.0650, -0.5540,  0.5659],
        [ 0.0110,  0.1897,  0.3502],
        [-0.0146, -0.3810,  0.6929],
        [-0.0532,  0.1595,  0.1368],
        [-0.1342,  0.2023,  0.0822],
        [-0.0168,  0.3508,  0.2061],
        [-0.2770,  0.3158, -0.1065],
        [ 0.0460, -0.2908,  0.3637],
        [-0.0835, -0.3180,  0.6212],
        [-0.2717, -0.1223,  0.0722]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1150: tensor([[-0.3951,  0.6822, -0.2955],
        [-0.2845,  0.4897, -0.3481],
        [-0.1125,  0.1227,  0.2398],
        [ 0.0086, -0.0570,  0.6034],
        [-0.0395,  0.2546,  0.2057],
        [-0.1744,  0.8526, -0.6260],
        [-0.2468,  0.2571, -0.0230],
        [-0.2069,  0.1019,  0.1584],
        [-0.1934,  0.5270, -0.4343],
        [-0.0073,  0.1532,  0.2376],
        [-0.2100,  0.3351, -0.0343],
        [-0.2042,  0.2432,  0.2381]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1200: tensor([[ 0.1374,  0.0251,  0.2667],
        [-0.0773,  0.2027, -0.0009],
        [-0.0560,  0.0417,  0.1412],
        [-0.1311,  0.2937,  0.1507],
        [-0.0949,  0.4350, -0.1469],
        [-0.2583,  0.3224, -0.3402],
        [ 0.0842, -0.1660,  0.2141],
        [-0.0385,  0.0178,  0.1480],
        [ 0.0101,  0.2379,  0.1545],
        [-0.2106,  0.1412,  0.0089],
        [-0.1501,  0.1603,  0.1800],
        [-0.0687,  0.3190, -0.1610]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1250: tensor([[-0.0514,  0.0602, -0.0805],
        [-0.1565,  0.5260, -0.1050],
        [-0.2375,  0.5210, -0.2087],
        [-0.0138, -0.0583,  0.5588],
        [-0.0887,  0.5035, -0.2827],
        [ 0.0461, -0.0516,  0.3813],
        [-0.0668,  0.0519,  0.1206],
        [ 0.0719,  0.5642, -0.2402],
        [ 0.1197, -0.5798,  0.8601],
        [ 0.0933,  0.2840, -0.0462],
        [-0.0426, -0.0240,  0.2531],
        [-0.1557,  0.2165,  0.0610]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1300: tensor([[ 0.1368,  0.0776,  0.4513],
        [ 0.0549, -0.6407,  0.7126],
        [-0.0511,  0.1508,  0.0467],
        [ 0.1153, -0.4776,  0.6402],
        [ 0.0297, -0.1102,  0.2751],
        [-0.0169, -0.0392,  0.4676],
        [ 0.0067,  0.2550,  0.1152],
        [-0.0563, -0.0127,  0.0588],
        [ 0.2139,  0.2770,  0.0018],
        [-0.1042, -0.3707,  0.4451],
        [ 0.1786,  0.2492, -0.0962],
        [ 0.2160, -0.1425,  0.5941]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1350: tensor([[-0.1613,  0.3169, -0.2739],
        [ 0.0171,  0.6080, -0.3220],
        [-0.1367,  0.4315, -0.1422],
        [-0.1905,  0.2025, -0.1635],
        [-0.0896,  0.0716, -0.1350],
        [-0.0859,  0.3930, -0.3503],
        [ 0.0353,  0.6880, -0.4283],
        [ 0.0908,  0.1824, -0.4024],
        [ 0.0104,  0.3640,  0.0302],
        [-0.1297,  0.4567, -0.2249],
        [-0.2293,  0.6580, -0.2775],
        [-0.1668,  0.2987, -0.1955]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1400: tensor([[-0.3174,  0.6726, -0.5618],
        [ 0.0430,  0.1716, -0.0019],
        [-0.1050,  0.1247, -0.1415],
        [ 0.1159,  0.1964, -0.0805],
        [-0.0325,  0.1643, -0.3641],
        [-0.0649,  0.1464, -0.3820],
        [ 0.1505, -0.1697,  0.0821],
        [ 0.0807,  0.1670, -0.0938],
        [-0.0649, -0.0052,  0.0329],
        [ 0.1281,  0.0408, -0.1410],
        [-0.0896,  0.0699, -0.1639],
        [-0.0290,  0.1973, -0.1049]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1450: tensor([[-0.1190,  0.5791, -0.7684],
        [ 0.0570,  0.2051, -0.3307],
        [-0.0821,  0.5656, -0.5091],
        [ 0.1110,  0.5791, -0.4668],
        [ 0.1746,  0.5291, -0.3882],
        [-0.0686,  0.6470, -0.3138],
        [-0.0736,  0.4089, -0.4202],
        [-0.1105,  0.5083, -0.5348],
        [-0.1971,  0.5684, -0.4876],
        [-0.3665,  0.5604, -0.5029],
        [ 0.1491,  0.4706, -0.2929],
        [ 0.0495,  0.4845, -0.2628]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1500: tensor([[-0.1982,  1.1308, -0.6297],
        [-0.1762,  0.5467, -0.4634],
        [-0.1189,  0.6835, -0.6065],
        [-0.0755,  0.6693, -0.5250],
        [-0.1822,  1.0588, -0.6740],
        [-0.2983,  0.7132, -0.7791],
        [-0.2045,  0.5426, -0.6679],
        [ 0.0491,  0.3668, -0.2939],
        [-0.1301,  0.5840, -0.4420],
        [-0.1653,  0.9455, -0.5721],
        [ 0.0640,  0.5861, -0.5080],
        [-0.2790,  0.7823, -0.6347]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1550: tensor([[ 0.1380,  0.0164, -0.2779],
        [ 0.0098,  0.6820, -0.6054],
        [ 0.0984,  0.1258, -0.5164],
        [ 0.4181,  0.1698, -0.1552],
        [ 0.1076,  0.3794, -0.4570],
        [ 0.0039,  0.5423, -0.4932],
        [ 0.1046,  0.2257, -0.4633],
        [ 0.1006,  0.2329, -0.2534],
        [ 0.1023,  0.3689, -0.3227],
        [ 0.1562,  0.1678, -0.3121],
        [-0.0444,  0.5202, -0.4939],
        [-0.0236,  0.3822, -0.5563]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1600: tensor([[-0.0163,  0.4228, -0.2929],
        [ 0.6402, -0.8472,  0.2814],
        [ 0.3266, -0.0372, -0.3113],
        [ 0.7424, -0.7618,  0.2726],
        [ 0.1371,  0.0892, -0.2519],
        [ 0.3737, -0.3277,  0.0408],
        [ 0.0950,  0.5671, -0.4548],
        [ 0.3530,  0.1902, -0.2464],
        [ 0.1011,  0.0537, -0.4032],
        [ 0.3106,  0.1184, -0.2026],
        [ 0.6747, -1.1238,  0.3000],
        [ 0.2979, -0.2037, -0.1654]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1650: tensor([[ 0.6463, -1.1376,  0.8682],
        [ 0.2636, -0.0071, -0.3149],
        [ 0.3340,  0.1492, -0.3250],
        [ 0.4170,  0.0548, -0.3390],
        [ 0.0848,  0.5122, -0.3245],
        [ 0.1102,  0.6574, -0.5077],
        [ 0.1348,  0.7095, -0.6310],
        [-0.0898,  0.4964, -0.8696],
        [ 0.2767,  0.3908, -0.4895],
        [ 0.1456,  0.4967, -0.3981],
        [ 0.0110,  0.3069, -0.4758],
        [ 0.3039,  0.0444, -0.4440]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1700: tensor([[ 0.1459,  0.8933, -0.6541],
        [ 0.1536,  0.6186, -0.8154],
        [ 0.3239,  0.3540, -0.4427],
        [ 0.1578,  0.3334, -0.6746],
        [ 0.2675,  0.4605, -0.5077],
        [ 0.0157,  0.9945, -0.7359],
        [-0.1548,  0.8715, -0.9198],
        [-0.0965,  0.8463, -0.8274],
        [ 0.6679, -0.9020,  0.7265],
        [ 0.5154, -0.4134,  0.1633],
        [ 0.4193, -0.1670,  0.0014],
        [ 0.0065,  0.1192, -0.3148]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1750: tensor([[-0.2088,  1.0083, -0.7313],
        [ 0.0720,  0.7686, -0.6353],
        [ 0.0553,  0.4547, -0.6607],
        [ 0.1082,  0.4931, -0.5480],
        [-0.0996,  0.7147, -0.9058],
        [-0.0832,  0.8256, -0.8135],
        [ 0.0806,  0.7255, -0.8682],
        [ 0.1048,  0.6894, -0.6852],
        [-0.0637,  0.4188, -0.6852],
        [ 0.2086,  0.3740, -0.5893],
        [ 0.2218,  0.8226, -0.6881],
        [-0.0845,  0.6906, -0.6431]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1800: tensor([[ 0.2066,  0.4250, -0.5413],
        [ 0.1924,  0.7037, -0.7231],
        [ 0.2568,  0.5086, -0.7294],
        [ 0.0737,  0.7987, -0.6219],
        [ 0.2148,  0.8004, -0.7904],
        [ 0.3005,  0.3870, -0.6454],
        [ 0.2663,  0.1922, -0.5614],
        [ 0.3490,  0.2971, -0.3990],
        [ 0.0167,  0.7196, -0.8239],
        [ 0.2165,  0.4822, -0.7333],
        [ 0.1353,  0.5498, -0.6925],
        [ 0.0219,  0.6320, -0.6558]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1850: tensor([[ 0.0901,  0.5317, -0.6620],
        [ 0.3252,  0.1917, -0.5548],
        [ 0.0236,  0.6355, -0.7553],
        [ 0.1375,  0.4744, -0.6428],
        [ 0.3942,  0.4289, -0.5739],
        [ 0.1682,  0.7069, -0.3124],
        [ 0.1492,  0.5926, -0.7278],
        [ 0.1245,  0.5071, -0.3932],
        [ 0.4379,  0.0819, -0.2133],
        [ 0.2611,  0.1109, -0.3046],
        [ 0.4778,  0.1288, -0.1236],
        [ 0.0714,  0.6137, -0.7169]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1900: tensor([[ 0.2113,  0.1652, -0.3332],
        [ 0.1566,  0.6128, -0.6483],
        [ 0.1091,  0.7036, -0.4548],
        [ 0.2003,  0.1910, -0.3190],
        [ 0.6743, -1.2768,  0.8283],
        [ 0.3190,  0.0769, -0.4171],
        [ 0.3037,  0.4372, -0.6353],
        [ 0.4350, -0.5152, -0.1360],
        [ 0.2681,  0.3629, -0.4991],
        [ 0.1753,  0.1634, -0.5536],
        [ 0.2728,  0.2540, -0.5086],
        [ 0.1862,  0.1734, -0.4336]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #1950: tensor([[ 0.0505,  0.1473, -0.4185],
        [ 0.2368,  0.5800, -0.4808],
        [ 0.3545,  0.1860, -0.1843],
        [ 0.1710,  0.5065, -0.4851],
        [ 0.0139,  0.5335, -0.9548],
        [-0.0451,  0.4423, -0.6311],
        [ 0.3038,  0.1025, -0.4011],
        [ 0.3185,  0.3973, -0.1847],
        [ 0.2864,  0.2052, -0.3589],
        [ 0.1913,  0.3976, -0.5152],
        [ 0.0717,  0.5060, -0.4993],
        [ 0.0426,  0.7896, -0.4939]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2000: tensor([[ 0.1302,  0.0815, -0.5830],
        [ 0.4845, -0.3040,  0.0268],
        [ 0.6547, -0.9717,  0.2755],
        [ 0.3339, -0.3647,  0.2149],
        [ 0.1732,  0.2918, -0.4817],
        [ 0.2097,  0.3653, -0.5279],
        [ 0.0765,  0.4663, -0.4778],
        [ 0.1487,  0.6204, -0.5605],
        [ 0.0812,  0.3399, -0.5996],
        [ 0.0126,  0.5080, -0.5337],
        [ 0.2231,  0.4152, -0.6137],
        [ 0.0772,  0.6868, -0.4297]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2050: tensor([[ 0.2280,  0.5663, -0.4471],
        [ 0.2316,  0.3172, -0.3247],
        [ 0.1634,  0.1026, -0.3109],
        [ 0.3618, -0.3537, -0.1016],
        [ 0.0133,  0.6079, -0.3498],
        [ 0.0512,  0.5271, -0.4776],
        [-0.0018,  0.6378, -0.6209],
        [-0.0168,  0.6136, -0.5109],
        [-0.0019,  0.5237, -0.5123],
        [-0.1606,  0.6169, -0.6535],
        [-0.0159,  0.5857, -0.5914],
        [ 0.0280,  0.5966, -0.6707]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2100: tensor([[ 0.1280,  0.0205, -0.3569],
        [-0.1231,  0.5594, -0.6721],
        [ 0.1843, -0.1430, -0.3177],
        [ 0.1505,  0.3405, -0.5061],
        [ 0.2289,  0.3682, -0.4629],
        [ 0.2876,  0.0713, -0.2363],
        [ 0.2154,  0.3917, -0.3971],
        [ 0.2445,  0.0504, -0.2319],
        [ 0.3994, -0.3963, -0.0009],
        [ 0.5930, -0.7543,  0.0675],
        [-0.0151,  0.2195, -0.3350],
        [ 0.1235,  0.3364, -0.3754]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2150: tensor([[ 0.1152,  0.1679, -0.2740],
        [ 0.2967,  0.0380, -0.3208],
        [ 0.2558,  0.1469, -0.2061],
        [ 0.2808,  0.2302, -0.3215],
        [ 0.2330,  0.4185, -0.3655],
        [ 0.1111,  0.3878, -0.5372],
        [ 0.0660,  0.4945, -0.5520],
        [ 0.2159,  0.2150, -0.3078],
        [ 0.1736,  0.2113, -0.3463],
        [ 0.0662,  0.4391, -0.3973],
        [ 0.1075,  0.3040, -0.4896],
        [ 0.1361,  0.5923, -0.4409]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2200: tensor([[ 0.2048,  0.4477, -0.4402],
        [ 0.0541,  0.2420, -0.4315],
        [ 0.1718,  0.1214, -0.2569],
        [ 0.4006,  0.2371, -0.2461],
        [ 0.0866,  0.2106, -0.3780],
        [ 0.3943,  0.1280, -0.2115],
        [-0.0054,  0.1166, -0.2247],
        [ 0.0470,  0.2218, -0.5118],
        [ 0.1535,  0.1355, -0.3243],
        [ 0.2977, -0.1892, -0.1544],
        [ 0.0669,  0.0726, -0.3160],
        [ 0.4119,  0.0689, -0.2118]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2250: tensor([[ 0.0444,  0.0731, -0.4520],
        [-0.0010,  0.3727, -0.2756],
        [-0.0069,  0.2639, -0.2871],
        [ 0.3137, -0.0736, -0.1651],
        [ 0.1151,  0.4100, -0.3566],
        [ 0.0300,  0.4147, -0.5580],
        [ 0.0483,  0.3959, -0.3627],
        [ 0.0522,  0.1664, -0.3823],
        [-0.0268,  0.4207, -0.4070],
        [ 0.1342,  0.6788, -0.2455],
        [-0.0612,  0.6053, -0.5034],
        [ 0.1686,  0.2629, -0.2748]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2300: tensor([[-0.1922,  0.6813, -0.5041],
        [-0.3120,  0.8091, -0.4261],
        [-0.2405,  0.9284, -0.3508],
        [-0.2079,  0.7108, -0.3310],
        [-0.0437,  0.2948, -0.3457],
        [-0.2553,  0.5240, -0.3326],
        [-0.5380,  0.8694, -0.4559],
        [-0.2308,  0.9373, -0.3973],
        [-0.3407,  0.5829, -0.4047],
        [-0.1872,  0.8233, -0.4562],
        [-0.1802,  0.8549, -0.4839],
        [-0.2091,  0.6996, -0.4019]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2350: tensor([[ 0.1629,  0.3695, -0.2200],
        [ 0.3279,  0.1843, -0.2482],
        [ 0.2367,  0.3238, -0.1719],
        [ 0.1314,  0.4008, -0.1641],
        [ 0.4154, -0.0028, -0.2062],
        [ 0.0906,  0.2943, -0.1743],
        [ 0.2888, -0.0289, -0.3278],
        [ 0.1528,  0.2189, -0.3044],
        [ 0.0418,  0.5391, -0.3080],
        [ 0.2206,  0.1807, -0.1709],
        [ 0.3854,  0.0077, -0.2276],
        [ 0.2116,  0.1847, -0.1203]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2400: tensor([[-0.4201,  0.7743, -0.0374],
        [-0.5461,  0.9221, -0.2266],
        [-0.6535,  1.1004, -0.1092],
        [-0.4128,  0.9052, -0.1789],
        [-0.4223,  0.8008, -0.2233],
        [-0.2443,  0.8484, -0.1863],
        [-0.4364,  0.7452, -0.0156],
        [-0.4661,  0.4999, -0.3817],
        [-0.4635,  1.0090, -0.2998],
        [-0.7560,  0.9597, -0.2313],
        [-0.2327,  0.8605,  0.0777],
        [-0.6560,  0.8019, -0.2913]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2450: tensor([[-0.1698,  0.3661, -0.1327],
        [-0.2060,  0.4894, -0.0756],
        [-0.3045,  0.6262, -0.1187],
        [-0.2587,  0.5855, -0.0596],
        [-0.4943,  0.4479, -0.2745],
        [-0.1606,  0.6155, -0.0761],
        [-0.1930,  0.4585, -0.0772],
        [-0.0071,  0.3690, -0.0937],
        [-0.2184,  0.5360, -0.0717],
        [-0.1871,  0.3960, -0.0579],
        [-0.1766,  0.3454, -0.0806],
        [-0.2768,  0.5042, -0.3045]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2500: tensor([[-0.1793,  0.3660, -0.0086],
        [-0.1283,  0.2246, -0.2171],
        [-0.0783,  0.4268, -0.0872],
        [-0.0755,  0.0572, -0.2874],
        [-0.0218,  0.3680,  0.0335],
        [-0.3286,  0.4717,  0.0418],
        [-0.0504,  0.3551, -0.0975],
        [-0.1543,  0.4454, -0.0068],
        [ 0.1935,  0.1886, -0.0227],
        [-0.0009,  0.2710, -0.1266],
        [ 0.0496, -0.0200, -0.1123],
        [-0.0855,  0.2285,  0.0179]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2550: tensor([[-0.3255,  0.4047, -0.0682],
        [ 0.0462,  0.4312, -0.0224],
        [-0.1587,  0.5842, -0.0372],
        [-0.2374,  0.4635,  0.0479],
        [ 0.0158,  0.3013, -0.1051],
        [ 0.1244,  0.2042, -0.0294],
        [-0.1457,  0.2739,  0.0196],
        [ 0.0592,  0.4175, -0.0058],
        [ 0.0575,  0.3759,  0.1090],
        [-0.1702,  0.5017, -0.0932],
        [ 0.0214,  0.2851, -0.1177],
        [-0.0451,  0.1193, -0.0691]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2600: tensor([[ 1.0141e-02,  3.1201e-01, -6.9958e-02],
        [-8.2327e-02,  3.6849e-01, -8.2302e-02],
        [-2.9769e-02,  4.2268e-01,  6.7525e-02],
        [ 1.4986e-02,  2.8602e-01, -1.0115e-02],
        [ 9.6859e-05,  3.4165e-01, -1.4117e-01],
        [-1.6494e-01,  1.4770e-01, -9.3785e-02],
        [ 1.7819e-01,  1.4358e-01, -8.1900e-02],
        [ 4.1288e-02,  2.7895e-01,  5.9463e-02],
        [-5.4791e-02,  3.8028e-01, -2.8529e-02],
        [ 4.6970e-02,  1.5080e-01,  1.8746e-01],
        [-5.2241e-02, -4.5120e-02,  5.1844e-02],
        [ 1.1370e-01, -1.2187e-01, -1.3225e-01]], device='cuda:0',
       grad_fn=<AddmmBackward>)
Iter #2650: tensor([[-0.0665,  0.1460, -0.1266],
        [-0.0812,  0.3029, -0.1205],
        [-0.0246,  0.2772, -0.0462],
        [-0.0883,  0.2616, -0.1436],
        [-0.2839,  0.4864, -0.1033],
        [ 0.1547,  0.1232,  0.0382],
        [-0.3283,  0.3800, -0.2175],
        [-0.1645,  0.4040, -0.0251],
        [-0.1155,  0.4142, -0.1063],
        [-0.1358,  0.6315,  0.0286],
        [-0.2199,  0.2189, -0.1302],
        [-0.0939,  0.2423,  0.0895]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2700: tensor([[-0.0196,  0.0912,  0.0444],
        [-0.2678,  0.4098,  0.0326],
        [-0.1847,  0.3929, -0.1022],
        [-0.4220,  0.4012, -0.3166],
        [ 0.3740, -0.2725,  0.0437],
        [-0.3389,  0.4519, -0.0782],
        [-0.1768,  0.3793,  0.0135],
        [ 0.0486,  0.0489,  0.1430],
        [-0.0246,  0.1604, -0.1474],
        [ 0.1911,  0.0135,  0.1105],
        [-0.3802,  0.5845, -0.0713],
        [-0.2652,  0.5699, -0.0343]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2750: tensor([[-0.0292,  0.3533,  0.0890],
        [ 0.1455,  0.3490, -0.0610],
        [-0.0910,  0.2044, -0.0494],
        [-0.1222,  0.3922, -0.1152],
        [ 0.0450,  0.1491,  0.0595],
        [-0.1341,  0.3972,  0.0631],
        [ 0.0440,  0.2327,  0.0381],
        [-0.0645,  0.2556,  0.1059],
        [ 0.1275,  0.0932,  0.0292],
        [ 0.2232, -0.1390, -0.0338],
        [ 0.1213,  0.1819,  0.0922],
        [ 0.2164,  0.0608,  0.0805]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2800: tensor([[-0.1185,  0.2351,  0.0854],
        [-0.0966,  0.3548,  0.0536],
        [-0.1461,  0.2632, -0.2575],
        [-0.0774,  0.2892,  0.1504],
        [-0.1065,  0.1999,  0.1261],
        [ 0.0561, -0.0599,  0.1027],
        [-0.0997,  0.3630,  0.0048],
        [-0.3067,  0.3196, -0.0146],
        [ 0.1622,  0.1266,  0.1533],
        [-0.1385,  0.3960,  0.0839],
        [-0.1935,  0.2648, -0.1517],
        [-0.0920,  0.2840,  0.0443]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2850: tensor([[-0.0570,  0.4502,  0.0437],
        [-0.1808,  0.3293,  0.0073],
        [ 0.0355,  0.0272,  0.0685],
        [ 0.0632,  0.3547,  0.0529],
        [-0.4661,  0.4540, -0.0321],
        [-0.0750,  0.1855,  0.0781],
        [ 1.1791, -1.2455,  0.1003],
        [-0.1549,  0.1928,  0.0028],
        [-0.1230,  0.2717, -0.0547],
        [-0.1581,  0.2622,  0.1030],
        [-0.0349,  0.3536,  0.0097],
        [-0.0414,  0.0041, -0.0502]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2900: tensor([[-0.2212,  0.3912,  0.1109],
        [-0.3358,  0.5394, -0.0415],
        [-0.3293,  0.5831,  0.0165],
        [-0.1465,  0.4091, -0.0489],
        [-0.2562,  0.1568, -0.0179],
        [-0.2104,  0.5809, -0.0745],
        [ 1.1884, -1.4753,  0.2955],
        [ 0.0176,  0.0587,  0.0995],
        [ 1.2752, -1.5245,  0.2925],
        [ 0.0139,  0.3290,  0.1263],
        [ 0.1903,  0.0891, -0.2120],
        [ 0.0821, -0.0020, -0.0933]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #2950: tensor([[ 1.1693, -1.5222,  0.3982],
        [ 0.0424,  0.2223,  0.0334],
        [-0.0560,  0.0613,  0.1081],
        [-0.1000,  0.2523,  0.1352],
        [-0.2053,  0.1257, -0.0192],
        [-0.1906,  0.4513, -0.0260],
        [-0.0317,  0.3812, -0.0414],
        [-0.0206,  0.2984,  0.0698],
        [-0.1149,  0.4355, -0.0652],
        [ 0.0325,  0.2301, -0.0738],
        [ 0.0038,  0.2164,  0.0912],
        [-0.1620,  0.3569, -0.0160]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #3000: tensor([[-0.0810, -0.0472, -0.1475],
        [ 0.0385, -0.0318,  0.0905],
        [-0.0556,  0.2061,  0.1682],
        [-0.0882,  0.0705,  0.2403],
        [-0.1757,  0.5944,  0.0443],
        [-0.1458,  0.2543,  0.0720],
        [-0.3826,  0.3826, -0.1787],
        [ 0.1721, -0.0452,  0.0437],
        [-0.2367,  0.2724, -0.0326],
        [-0.0281,  0.1969,  0.1011],
        [-0.1035,  0.2443, -0.0245],
        [-0.1905,  0.5234,  0.1238]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #3050: tensor([[-0.0962,  0.0901,  0.1014],
        [ 0.9479, -1.4411,  0.3141],
        [-0.0852,  0.2272, -0.0688],
        [-0.2555,  0.3843, -0.0800],
        [-0.2151,  0.1256,  0.0512],
        [-0.1382,  0.1115,  0.0790],
        [-0.2477,  0.2305,  0.0302],
        [ 0.1128,  0.2238,  0.0479],
        [-0.2863,  0.3651, -0.0656],
        [-0.1673,  0.0612,  0.0807],
        [-0.2032,  0.0356, -0.0652],
        [-0.0245,  0.2519,  0.1029]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #3100: tensor([[-0.1974,  0.1824,  0.0013],
        [-0.1405,  0.3277,  0.0322],
        [-0.3338,  0.3945, -0.0422],
        [-0.0409,  0.4207,  0.0151],
        [-0.0380,  0.2597,  0.0753],
        [-0.0652,  0.2643,  0.0611],
        [ 0.0570,  0.2457,  0.1440],
        [ 0.0246,  0.3490,  0.1545],
        [-0.0728,  0.3777, -0.0204],
        [-0.2184,  0.3110,  0.0108],
        [-0.2720,  0.2597,  0.0771],
        [-0.0971,  0.4837,  0.1596]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #3150: tensor([[-0.2776,  0.2501,  0.0314],
        [-0.0370,  0.1978,  0.1275],
        [-0.3303,  0.3104,  0.1082],
        [-0.3523,  0.3436, -0.0014],
        [-0.0897,  0.1697,  0.2284],
        [-0.2385,  0.2545,  0.0704],
        [-0.1574,  0.0104,  0.1370],
        [-0.1862,  0.3411,  0.0833],
        [ 0.0403, -0.0255, -0.0595],
        [-0.0458,  0.3526,  0.1026],
        [ 0.0671, -0.0125,  0.2791],
        [-0.2973,  0.4519,  0.0430]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #3200: tensor([[-0.0700,  0.2413,  0.0784],
        [-0.2739,  0.4842, -0.0544],
        [-0.2997,  0.3767, -0.0042],
        [-0.0538,  0.3265,  0.0462],
        [-0.0865,  0.2148,  0.0523],
        [-0.1669,  0.1129, -0.0183],
        [-0.0109, -0.0694,  0.1455],
        [-0.0099,  0.1297,  0.1508],
        [-0.2803,  0.2413, -0.0836],
        [ 0.1502, -0.0245,  0.3203],
        [-0.1837,  0.2874,  0.0079],
        [-0.2979,  0.4307, -0.0507]], device='cuda:0', grad_fn=<AddmmBackward>)
Iter #3250: tensor([[-1.4620e-01,  3.5273e-01,  1.7314e-01],
        [-1.5620e-01,  1.8414e-01,  1.1915e-01],
        [-4.7222e-02,  1.3292e-01,  1.4373e-01],
        [-4.1344e-01,  4.8517e-01, -1.5962e-02],
        [ 2.0405e-01,  8.7842e-02,  2.1125e-01],
        [-1.8256e-01,  2.8398e-01, -5.6135e-02],
        [-7.2382e-02,  5.1179e-01,  5.0394e-02],
        [-1.2045e-01,  5.1616e-01,  9.1994e-02],
        [-2.7322e-01,  4.4569e-01,  6.2586e-03],
        [ 7.2929e-04,  1.2975e-01,  1.0107e-01],
        [-1.1454e-01,  3.3103e-01,  1.3108e-01],
        [ 5.1089e-04,  1.8208e-01,  3.0181e-01]], device='cuda:0',
       grad_fn=<AddmmBackward>)
